[igt-dev] [PATCH i-g-t 1/4] lib/i915/perf: Add i915_perf library

Umesh Nerlige Ramappa umesh.nerlige.ramappa at intel.com
Sat Feb 15 01:11:12 UTC 2020


From: Lionel Landwerlin <lionel.g.landwerlin at intel.com>

Add perf OA metrics configurations that are used by the perf tools to
capture OA data and used by GPUvis.

v2: (Umesh)
- prevent generation of codegen.pyc
- rebase build fixes for igt lists

Signed-off-by: Lionel Landwerlin <lionel.g.landwerlin at intel.com>
Signed-off-by: Umesh Nerlige Ramappa <umesh.nerlige.ramappa at intel.com>
---
 lib/i915-perf.pc.in                        |    10 +
 lib/i915/perf-configs/README.md            |   115 +
 lib/i915/perf-configs/codegen.py           |    33 +
 lib/i915/perf-configs/guids.xml            |   282 +
 lib/i915/perf-configs/mdapi-xml-convert.py |  1000 ++
 lib/i915/perf-configs/oa-bdw.xml           | 15653 +++++++++++++++++++
 lib/i915/perf-configs/oa-bxt.xml           |  9595 ++++++++++++
 lib/i915/perf-configs/oa-cflgt2.xml        | 10866 +++++++++++++
 lib/i915/perf-configs/oa-cflgt3.xml        | 10933 +++++++++++++
 lib/i915/perf-configs/oa-chv.xml           |  9757 ++++++++++++
 lib/i915/perf-configs/oa-cnl.xml           | 10411 ++++++++++++
 lib/i915/perf-configs/oa-glk.xml           |  9346 +++++++++++
 lib/i915/perf-configs/oa-hsw.xml           |  4615 ++++++
 lib/i915/perf-configs/oa-icl.xml           | 11899 ++++++++++++++
 lib/i915/perf-configs/oa-kblgt2.xml        | 10866 +++++++++++++
 lib/i915/perf-configs/oa-kblgt3.xml        | 10933 +++++++++++++
 lib/i915/perf-configs/oa-sklgt2.xml        | 11895 ++++++++++++++
 lib/i915/perf-configs/oa-sklgt3.xml        | 10933 +++++++++++++
 lib/i915/perf-configs/oa-sklgt4.xml        | 10956 +++++++++++++
 lib/i915/perf-configs/perf-codegen.py      |   854 +
 lib/i915/perf-configs/update-guids.py      |   230 +
 lib/i915/perf.c                            |   194 +
 lib/i915/perf.h                            |   238 +
 lib/meson.build                            |    64 +
 tools/i915-perf/i915_perf_configs.c        |   277 +
 tools/i915-perf/meson.build                |     5 +
 tools/meson.build                          |     1 +
 27 files changed, 151961 insertions(+)
 create mode 100644 lib/i915-perf.pc.in
 create mode 100644 lib/i915/perf-configs/README.md
 create mode 100644 lib/i915/perf-configs/codegen.py
 create mode 100644 lib/i915/perf-configs/guids.xml
 create mode 100755 lib/i915/perf-configs/mdapi-xml-convert.py
 create mode 100644 lib/i915/perf-configs/oa-bdw.xml
 create mode 100644 lib/i915/perf-configs/oa-bxt.xml
 create mode 100644 lib/i915/perf-configs/oa-cflgt2.xml
 create mode 100644 lib/i915/perf-configs/oa-cflgt3.xml
 create mode 100644 lib/i915/perf-configs/oa-chv.xml
 create mode 100644 lib/i915/perf-configs/oa-cnl.xml
 create mode 100644 lib/i915/perf-configs/oa-glk.xml
 create mode 100644 lib/i915/perf-configs/oa-hsw.xml
 create mode 100644 lib/i915/perf-configs/oa-icl.xml
 create mode 100644 lib/i915/perf-configs/oa-kblgt2.xml
 create mode 100644 lib/i915/perf-configs/oa-kblgt3.xml
 create mode 100644 lib/i915/perf-configs/oa-sklgt2.xml
 create mode 100644 lib/i915/perf-configs/oa-sklgt3.xml
 create mode 100644 lib/i915/perf-configs/oa-sklgt4.xml
 create mode 100755 lib/i915/perf-configs/perf-codegen.py
 create mode 100755 lib/i915/perf-configs/update-guids.py
 create mode 100644 lib/i915/perf.c
 create mode 100644 lib/i915/perf.h
 create mode 100644 tools/i915-perf/i915_perf_configs.c
 create mode 100644 tools/i915-perf/meson.build

diff --git a/lib/i915-perf.pc.in b/lib/i915-perf.pc.in
new file mode 100644
index 00000000..6524d0d9
--- /dev/null
+++ b/lib/i915-perf.pc.in
@@ -0,0 +1,10 @@
+prefix=@prefix@
+exec_prefix=@exec_prefix@
+libdir=@libdir@
+includedir=@includedir@
+
+Name: i915-perf
+Description: i915 perf library
+Version: @IGT_VERSION@
+Libs: -L${libdir} -li915_perf
+Cflags: -I${includedir}
diff --git a/lib/i915/perf-configs/README.md b/lib/i915/perf-configs/README.md
new file mode 100644
index 00000000..df31d6ae
--- /dev/null
+++ b/lib/i915/perf-configs/README.md
@@ -0,0 +1,115 @@
+# About guids.xml
+
+This is the authoritive registry of unique identifers for different OA unit
+hardware configurations. Userspace can reliably use these identifiers to map a
+configuration to corresponding normalization equations and counter meta data.
+
+If a hardware configuration ever changes in a backwards incompatible way
+(changing the semantics and/or layout of the raw counters) then it must be
+given a new GUID.
+
+mdapi-xml-convert.py will match metric sets with a GUID from this file based on
+an md5 hash of the hardware register configuration and skip a metric set with a
+warning if no GUID could be found.
+
+All new metric sets need to be allocated a GUID here before
+mdapi-xml-convert.py or i915-perf-kernelgen.py will output anything for that
+metric set. This ensures we don't automatically import new metric sets without
+some explicit review that that's appropriate.
+
+A failure to find a GUID for an older metric set most likely implies that the
+register configuration was changed. It's possible that the change is benign
+(e.g. a comment change) and in that case the mdapi_config_hash for the
+corresponding metric set below can be updated.
+
+The update-guids.py script is the recommended way of managing updates to this
+file by generate a temporary file with proposed updates that you can compare
+with the current guids.xml.
+
+
+# update-guids.xml
+
+update-guids.py can help with:
+
+* Recognising new metrics from VPG's MDAPI XML files
+
+  *(NOTE: new guids.xml entries will initially be missing the
+  config_hash=MD5_HASH attribute until mdapi-xml-convert.py is used to generate
+  a corresponding oa-*.xml config description)*
+
+* Adding a config_hash=MD5_HASH attribute to recently added guids.xml entries
+  after mdapi-xml-convert.py has been run.
+
+* Allocating a GUID for a custom metric that doesn't have a counterpart in
+  VPG's MDAPI XML files.
+
+  For this case you can add a stub entry with only a name like `<guid
+  name="Foo">` to guids.xml and then running update-guids.py will output a
+  corresponding line with the addition of an id=UUID attribute.
+
+
+# How to sync the oa-\*.xml files with latest internal MDAPI XML files
+
+1. E.g. copy a new `MetricsXML_BDW.xml` to `mdapi/MetricsXML_BDW.xml`
+
+*Note: that the `mdapi-xml-convert.py` script will only convert configs that
+have a corresponding GUID entry within `guids.xml`. This check helps avoid
+unintentionally publishing early, work-in-progress/pre-production configs.*
+
+The `guids.xml` registry maps each, complex OA unit register configuration to a
+unique ID that userspace can recognise and trust the semantics of raw counters
+read using that configuration. (Just for reference, this is particularly
+valuable for tools that capture raw metrics for later, offline processing since
+the IDs effectively provide a compressed description of how to interpret the
+data by providing an index into a database of high-level counter descriptions.)
+
+The registry associates each ID with a hash of the HW register config as found in
+MDAPI XML files ('mdapi_config_hash') and also with a hash of the HW config as
+found in oa-\*.xml files ('config_hash'). The hashes used for lookups in the
+registry also help detect when the register config for a pre-existing metric set
+is updated. Note: these hashes are only for the low-level hardware configuration
+so updates to counter descriptions used by fronted UIs won't affect indexing
+here.
+
+There is a chicken and egg situation when updating or adding new entries to
+guids.xml since we can't hash the configs in oa-\*.xml until successfully running
+mdapi-xml-convert.py which depends on a guids.xml registry entry first. The
+update-guids.xml script will output registry entries without an oa-\*.xml config
+hash if not available and can be re-run after mdapi-xml-convert.py to add the
+missing hashes.
+
+2. Now run:
+```
+./update-guids.py --guids=guids.xml mdapi/MetricsXML_BDW.xml > guids.xml2
+```
+*(note the script expects to find oa-\*.xml files in the current directory)*
+
+Diff `guids.xml` and `guilds.xml2` (easiest with a side-by-side diff editor) and
+review the registry changes. *Note: many lines will have a warning like `"Not
+found in MDAPI XML file[s]..."` if `update-guids.xml` wasn't given all known
+MDAPI XML files but in this case they can be ignored for all non-BDW configs.*
+
+*Note: for any config that is already supported upstream in the i915 perf driver
+we need to be careful if the hash for a metric set changes in case the semantics
+for any raw counters were changed. The semantics of raw counters associated with
+a given GUID form part of the drm i915 perf uapi contract and must remain
+backwards compatible.*
+
+If the diff shows any `mdapi_config_hash` changes for pre-existing (especially
+upstream) configs you should review the MDAPI XML changes for the metric set and
+verify the change just relates to a bug fix. If more substantial changes were
+made which could mean we need to treat it as a new config. Handling the later
+case is left as an exercise to the reader, since it hasn't happened so far :-D.
+Assuming all the changes and new entries look good they can be copied into
+`guids.xml`, removing any trailing comment left by `update-guids.py`.
+
+3. Now run mdapi-xml-convert.py:
+```
+./mdapi-xml-convert.py --guids=guids.xml mdapi/MetricsXML_BDW.xml > oa-bdw.xml
+```
+
+4. We can now update new entries in guids.xml with a 'config_hash':
+```
+./update-guids.py --guids=guids.xml mdapi/MetricsXML_BDW.xml > guids.xml2
+```
+*(and again diff, check the changes and copy across)*
diff --git a/lib/i915/perf-configs/codegen.py b/lib/i915/perf-configs/codegen.py
new file mode 100644
index 00000000..0802547a
--- /dev/null
+++ b/lib/i915/perf-configs/codegen.py
@@ -0,0 +1,33 @@
+class Codegen:
+
+    _file = None
+    _indent = 0
+
+    endl="\n"
+    use_tabs = False
+
+    def __init__(self, filename = None):
+        if filename != None:
+            self._file = open(filename, 'w')
+
+    def __call__(self, *args):
+        if self._file:
+            code = ' '.join(map(str, args))
+            for line in code.splitlines():
+                indent = ''.rjust(self._indent)
+
+                if self.use_tabs:
+                    indent = indent.replace("        ", "\t")
+
+                text = indent + line
+                self._file.write(text.rstrip() + self.endl)
+
+    #without indenting or new lines
+    def frag(self, *args):
+        code = ' '.join(map(str, args))
+        self._file.write(code)
+
+    def indent(self, n):
+        self._indent = self._indent + n
+    def outdent(self, n):
+        self._indent = self._indent - n
diff --git a/lib/i915/perf-configs/guids.xml b/lib/i915/perf-configs/guids.xml
new file mode 100644
index 00000000..159ad9e7
--- /dev/null
+++ b/lib/i915/perf-configs/guids.xml
@@ -0,0 +1,282 @@
+<!--
+    This is the authoritive registry of unique identifers for different OA unit
+    hardware configurations. Userspace can reliably use these identifiers to
+    map a configuration to corresponding normalization equations and counter
+    meta data.
+
+    Most maintenance is done using the update-guids.py helper script to generate
+    a temporary guids.xml.update file which should then be manually compared with
+    a visual diff tool to cherry pick the final changes into guids.xml.
+
+    See README.md for more details.
+-->
+<guids>
+    <guid id="2f01b241-7014-42a7-9eb6-a925cad3daba" chipset="all" name="MDAPI" />
+    <guid config_hash="b96ab550dbb61fa1d1a98b2d6f938e9c" mdapi_config_hash="c675607e7d1b0083729e4b1621fd25f8" id="a490e9d2-55b3-4db0-8dab-53011032c5f3" chipset="hsw" name="RenderBasic" />
+    <guid config_hash="3b656e19962cf1990cfb253a59946266" mdapi_config_hash="09199618ca154304fd42ca5ee19187f4" id="b344c8cb-a291-4cbf-aa9c-b40213bfc96f" chipset="hsw" name="ComputeBasic" />
+    <guid config_hash="bb978ccd4f1eca6d7806f304a42fb10f" mdapi_config_hash="77524b565825e61259436f526848c1e1" id="480f9795-cf6a-4204-a9e3-cd7015515f8d" chipset="hsw" name="ComputeExtended" />
+    <guid config_hash="890e4b72a09b71cb9c4522fbd8f7e45a" mdapi_config_hash="28d4ec8839e660bac90c3fbfa815ce45" id="399d3001-97d6-4240-b065-4fb843138e17" chipset="hsw" name="MemoryReads" />
+    <guid config_hash="904374d80088ec4941ab3c1dbed1aac0" mdapi_config_hash="6a8cbc42da4822a17d3de385d6811c1a" id="f3c1ff4b-d0da-4ffa-8780-2c6b98f3f2d5" chipset="hsw" name="MemoryWrites" />
+    <guid config_hash="35111d939881fd8e2367f89f86b43d19" mdapi_config_hash="4f8c749ea23ece9349cf690908159b6b" id="e111cda4-19c3-41ee-b326-f99ac44ebf78" chipset="hsw" name="SamplerBalance" />
+    <guid mdapi_config_hash="3c2ee9a97141f36bc13828aeda30e477" id="ce81ddfb-573f-4100-8b9a-8dc93a5e5c8c" chipset="hsw" name="RenderBalance" />
+    <guid mdapi_config_hash="7ffc6e4d3d2284ea76e9390b0fd8aaf1" id="2fbbb85b-0f33-4aeb-9d92-35256de2662f" chipset="hsw" name="MemoryReadsOnWritePort" />
+    <guid mdapi_config_hash="ff6824b311096312105547bbe5e65758" id="a1476140-3af3-4556-b5fe-501e2df8b963" chipset="hsw" name="StencilPmaHold" />
+    <guid mdapi_config_hash="414afdc7b2570bbbe07406ec675f3040" id="b3d5350e-32ba-4c72-96c2-0a504e86eda3" chipset="hsw" name="MediaMemoryReads" />
+    <guid mdapi_config_hash="cf80117b63d376e87735b73e8f5ebc5b" id="69b42918-c915-439a-9e4b-a82fe3c9e1a3" chipset="hsw" name="MediaMemoryWrites" />
+    <guid mdapi_config_hash="3566f20e9e3707cb9aefccff3ead7572" id="18024740-aa68-4d25-877e-082c9fdcb895" chipset="hsw" name="MediaVmePipe" />
+    <guid config_hash="240f9cd7a6699b44ff0bf22b24449ac0" mdapi_config_hash="961180e14745136637cfd0253c6c0a63" id="d6de6f55-e526-4f79-a6a6-d7315c09044e" chipset="bdw" name="TestOa" />
+    <guid config_hash="9c4955c220cbcc5f9ff3ce6e7af64cf5" mdapi_config_hash="7f7918e87f574f62cc4e8d37f660abc5" id="b541bd57-0e0f-4154-b4c0-5858010a2bf7" chipset="bdw" name="RenderBasic" />
+    <guid config_hash="35d980685774e3631a7e5eb4d23a0013" mdapi_config_hash="ea406bf4dc4e4edd5e29cce12bef1778" id="35fbc9b2-a891-40a6-a38d-022bb7057552" chipset="bdw" name="ComputeBasic" />
+    <guid config_hash="d17b0801f998c4b119c63b0467e8f9b5" mdapi_config_hash="fbde7829568089b44b53a1eefbad9b0e" id="8fb61ba2-2fbb-454c-a136-2dec5a8a595e" chipset="bdw" name="ComputeExtra" />
+    <guid config_hash="1bb1be4885c0568bf0d3bd5df9fe4a7a" mdapi_config_hash="f0c3b043834e63d21ba6be573df02e32" id="233d0544-fff7-4281-8291-e02f222aff72" chipset="bdw" name="RenderPipeProfile" />
+    <guid config_hash="9147786065e1562d254a1dc82c14b4f9" mdapi_config_hash="fa121c59e98aa4f860c797bfab097cd7" id="2b255d48-2117-4fef-a8f7-f151e1d25a2c" chipset="bdw" name="MemoryReads" />
+    <guid config_hash="13cadf5e130b16bf6cf777e34ff54fcf" mdapi_config_hash="7e324f6f7cb980832735ada1e12f7905" id="f7fd3220-b466-4a4d-9f98-b0caf3f2394c" chipset="bdw" name="MemoryWrites" />
+    <guid config_hash="552b53f8d91428cec6eab6bff62ae8af" mdapi_config_hash="6ba093cf3feb68f521e579169ad689cf" id="e99ccaca-821c-4df9-97a7-96bdb7204e43" chipset="bdw" name="ComputeExtended" />
+    <guid config_hash="2cf68f22eadf4cb430a7e2a76fab3632" mdapi_config_hash="e9913c0dd30d6ccab98c5dec58dc7162" id="27a364dc-8225-4ecb-b607-d6f1925598d9" chipset="bdw" name="ComputeL3Cache" />
+    <guid config_hash="15d5387219cda641a8964b9edeb86b6d" mdapi_config_hash="fc357f19e2a77465c3232693f3bb1444" id="857fc630-2f09-4804-85f1-084adfadd5ab" chipset="bdw" name="DataPortReadsCoalescing" />
+    <guid config_hash="95a2d953682c60ee0213c41892067b94" mdapi_config_hash="be3980a5f0e6057e641b884fc56b07ff" id="343ebc99-4a55-414c-8c17-d8e259cf5e20" chipset="bdw" name="DataPortWritesCoalescing" />
+    <guid config_hash="9004a46b9728e0f12232ce8b151d3224" mdapi_config_hash="715fe2c431914b6b369970c0b897f7e2" id="e1743ca0-7fc8-410b-a066-de7bbb9280b7" chipset="bdw" name="VMEPipe" />
+    <guid config_hash="bb8d49db81e7bd822188ed5a958b4863" mdapi_config_hash="f94fd6ba5bfa83bb965705f1c69f1d37" id="78490af2-10fa-430b-ae3c-94ec04d5214e" chipset="bdw" name="HDCAndSF" />
+    <guid config_hash="19924ef1563f10e386755b531d44a3fb" mdapi_config_hash="a5589479b360f6d4f5c8f70fe78b0e1d" id="c0abdd97-3b13-4cad-814c-bd178804e02c" chipset="bdw" name="L3_1" />
+    <guid config_hash="41217f1f74d9e181726736ab9af57c32" mdapi_config_hash="0fc152bfbb920f90b16ed0445afe9e48" id="ad665281-a7cf-483a-bd10-0e07c43f61c7" chipset="bdw" name="L3_2" />
+    <guid config_hash="f17717dae4348688c670212b507d451a" mdapi_config_hash="2afc3cdd7ffbb021fc0ae99681b138ab" id="930a15aa-4300-4fce-a9ba-edb0b9e880be" chipset="bdw" name="L3_3" />
+    <guid config_hash="71232cf595afad2b53666f6c233447e8" mdapi_config_hash="032c9ab7c2c6d056da82e4ee1b159c18" id="d7793b26-b5e3-4f0f-ad78-7ebc9d0b4c7d" chipset="bdw" name="L3_4" />
+    <guid config_hash="b8a474b7965b6d9ec62641732d0d479b" mdapi_config_hash="b2454e1eef8d38d83cb95ba2b3d85431" id="da0f7875-1143-4d73-a39c-9128a951c46a" chipset="bdw" name="RasterizerAndPixelBackend" />
+    <guid config_hash="f8f05a9f4ce4bd928f1343180584f7de" mdapi_config_hash="6fb026e2926fbd3a507e55a7bf0a3687" id="52c186e4-39e3-4534-87cd-41bd47763df9" chipset="bdw" name="Sampler_1" />
+    <guid config_hash="30ee983d5ba223ad552acc3debc13c00" mdapi_config_hash="e38e63da0d875958bc88a9deb8d529ba" id="edcb8c31-764d-451a-9ecd-c9c89fb54f8d" chipset="bdw" name="Sampler_2" />
+    <guid config_hash="bbc70da24570ab578fb1416217fc0834" mdapi_config_hash="c905876bdf561cc26c64363ced258c64" id="729fc3f4-ccff-4902-be6b-f1a22cc92c02" chipset="bdw" name="TDL_1" />
+    <guid config_hash="803ca6eb4feef4090332003b65607c95" mdapi_config_hash="0000753d7f52fb3a0b0baa6b44052cff" id="29598975-4785-43ab-a981-1dfa58d0e835" chipset="bdw" name="TDL_2" />
+    <guid config_hash="c45ebb398888eabb889be632432550eb" mdapi_config_hash="a3c52d64b6d187b02de43af112abc509" id="0a9eb7be-feee-4275-a139-6d9cedf0fdb0" chipset="bdw" name="GpuBusyness" />
+    <guid config_hash="13a7f7de484592659ef4d346901bde25" mdapi_config_hash="59cd2454083f4855dca14637425d733c" id="e713f347-953e-4d8c-b02f-6be31df2db2b" chipset="bdw" name="STC_PmaStall" />
+    <guid config_hash="867e736ad8c49a9f4cd17b58f1b0b0cc" mdapi_config_hash="d996104bf7531170226275d44a3602b6" id="4a534b07-cba3-414d-8d60-874830e883aa" chipset="chv" name="TestOa" />
+    <guid config_hash="4fe7c53a36b24f621e11a1487d46e325" mdapi_config_hash="089852d3f5babff2175457f57214ce57" id="9d8a3af5-c02c-4a4a-b947-f1672469e0fb" chipset="chv" name="RenderBasic" />
+    <guid config_hash="6472c5788ff47d2f8f88b86b7314c09e" mdapi_config_hash="60375bf6570a28320cce512ab6d024e0" id="f522a89c-ecd1-4522-8331-3383c54af5f5" chipset="chv" name="ComputeBasic" />
+    <guid config_hash="532bafcf355d5812242ab50a362bf934" mdapi_config_hash="1466be3c679aeeb0627be174ead35e58" id="a9ccc03d-a943-4e6b-9cd6-13e063075927" chipset="chv" name="RenderPipeProfile" />
+    <guid config_hash="bb8d49db81e7bd822188ed5a958b4863" mdapi_config_hash="f94fd6ba5bfa83bb965705f1c69f1d37" id="33af8252-7a51-4aa3-b0ba-1b946f209d7b" chipset="chv" name="HDCAndSF" />
+    <guid config_hash="19924ef1563f10e386755b531d44a3fb" mdapi_config_hash="a5589479b360f6d4f5c8f70fe78b0e1d" id="78f52900-5317-4417-8067-966fbf215a1f" chipset="chv" name="L3_1" />
+    <guid config_hash="41217f1f74d9e181726736ab9af57c32" mdapi_config_hash="0fc152bfbb920f90b16ed0445afe9e48" id="0db4fe4a-2648-4064-bd6a-89c06d0c27b3" chipset="chv" name="L3_2" />
+    <guid config_hash="f17717dae4348688c670212b507d451a" mdapi_config_hash="2afc3cdd7ffbb021fc0ae99681b138ab" id="0de6539e-33b4-4aee-83c4-9ab45a579b94" chipset="chv" name="L3_3" />
+    <guid config_hash="71232cf595afad2b53666f6c233447e8" mdapi_config_hash="032c9ab7c2c6d056da82e4ee1b159c18" id="be74c9d6-268f-4d7f-b2e8-8d91d4441883" chipset="chv" name="L3_4" />
+    <guid config_hash="b8a474b7965b6d9ec62641732d0d479b" mdapi_config_hash="b2454e1eef8d38d83cb95ba2b3d85431" id="31bc1ff3-8d09-4497-9d79-59c4f943b502" chipset="chv" name="RasterizerAndPixelBackend" />
+    <guid config_hash="f8f05a9f4ce4bd928f1343180584f7de" mdapi_config_hash="6fb026e2926fbd3a507e55a7bf0a3687" id="05450fec-bb5c-4b0a-8995-e03631168a34" chipset="chv" name="Sampler_1" />
+    <guid config_hash="30ee983d5ba223ad552acc3debc13c00" mdapi_config_hash="e38e63da0d875958bc88a9deb8d529ba" id="883c8a56-8767-4de8-beec-a99462c6674b" chipset="chv" name="Sampler_2" />
+    <guid config_hash="bbc70da24570ab578fb1416217fc0834" mdapi_config_hash="c905876bdf561cc26c64363ced258c64" id="eb97e523-d9ac-48a9-b7f8-9cc909ddbf14" chipset="chv" name="TDL_1" />
+    <guid config_hash="803ca6eb4feef4090332003b65607c95" mdapi_config_hash="0000753d7f52fb3a0b0baa6b44052cff" id="dff6158e-8409-452c-be76-91c9946330bd" chipset="chv" name="TDL_2" />
+    <guid mdapi_config_hash="5cc4d10d745060d0672ffb4ebf0d1687" id="22480aac-b81a-40ce-8770-1061ce51dff7" chipset="chv" name="StencilPmaHold" />
+    <guid mdapi_config_hash="f3ae7e16e9b6aadac98179bc4c847246" id="f8315f64-668e-405e-a6d6-c52e4d9e8f1c" chipset="chv" name="MediaMemoryReads" />
+    <guid mdapi_config_hash="ea98859ab4afdda2589be697455c7dc8" id="6df9f4c3-4775-4f47-be6a-991fba7a02c7" chipset="chv" name="MediaMemoryWrites" />
+    <guid mdapi_config_hash="179e6a40c74a8401597b82383dacfd70" id="e7b839a6-6045-4ec7-aaa5-f6aab87a55aa" chipset="chv" name="MediaVmePipe" />
+    <guid mdapi_config_hash="3ed20c9f7071cef87fd28d2f899c9e6c" id="aa7d6b37-3e8f-46a4-ab50-e58f8efbdab9" chipset="chv" name="HdcUrbCoalescing" />
+    <guid mdapi_config_hash="b39b58578bb37520010084d2fb489c47" id="d991c4b4-7c8b-43a9-b187-7b143cb903cc" chipset="chv" name="L3" />
+    <guid mdapi_config_hash="36c6e4beda33281c27a79f4134ea9f80" id="531d4a91-df08-4dd4-8c5c-0158321a9ee0" chipset="chv" name="SamplerAndHDCAndTDL" />
+    <guid mdapi_config_hash="959a0f3d993feb51a3ce93ea3b61d726" id="ca514a15-e550-4277-ba52-b7cfa4929e25" chipset="chv" name="TDL" />
+    <guid mdapi_config_hash="f1232ea7b1a2bc5b0cfc7d640528e5b2" id="2a933a92-bddc-44dd-a06a-672391972b5e" chipset="chv" name="ComputeL3Cache" />
+    <guid config_hash="e018d083414e4d28e0ed481554128883" mdapi_config_hash="dce59e977ffff25a57f2486f5d9a7c60" id="5ee72f5c-092f-421e-8b70-225f7c3e9612" chipset="bxt" name="TestOa" />
+    <guid config_hash="203852243e7fde6887b1db92862d5eee" mdapi_config_hash="9bf85c8db90bbb173411dd8fbf2c9d90" id="22b9519a-e9ba-4c41-8b54-f4f8ca14fa0a" chipset="bxt" name="RenderBasic" />
+    <guid config_hash="cde046a01aba9c56d6fa44bf2c0f26c2" mdapi_config_hash="86794812560853ea5531d6eb816c7bfa" id="012d72cf-82a9-4d25-8ddf-74076fd30797" chipset="bxt" name="ComputeBasic" />
+    <guid config_hash="a19a55aad269ccc1ed4380314eda4bed" mdapi_config_hash="ac34c2028f3f4fae92e58aae1496901b" id="fa6ecf21-2cb8-4d0b-9308-6e4a7b4ca87a" chipset="bxt" name="ComputeExtra" />
+    <guid config_hash="1669463a6836f6d057cbf3e41506923b" mdapi_config_hash="c4b66b414f42b7e6f1b9941b445f79f2" id="ce416533-e49e-4211-80af-ec513590a914" chipset="bxt" name="RenderPipeProfile" />
+    <guid config_hash="f9eee3f0c9653ffd05e4876be0ea44d5" mdapi_config_hash="f707783ff8ea456ddc55fbaeb1a3bc0a" id="398e2452-18d7-42d0-b241-e4d0a9148ada" chipset="bxt" name="MemoryReads" />
+    <guid config_hash="03e840f1d8597b3c6c4015792243ce7d" mdapi_config_hash="b7e416688493d93c6a319a39c1c91fda" id="d324a0d6-7269-4847-a5c2-6f71ddc7fed5" chipset="bxt" name="MemoryWrites" />
+    <guid config_hash="39a03c065f1fdb5bf680207dc520cdb2" mdapi_config_hash="c90ecb54cbe7609fc6743f5273b68962" id="caf3596a-7bb1-4dec-b3b3-2a080d283b49" chipset="bxt" name="ComputeExtended" />
+    <guid config_hash="c241c2999f487dc995cecdb35b01197b" mdapi_config_hash="03f5a72e5e1ce82b6e3e14855298bf3d" id="49b956e2-d5b9-47e0-9d8a-cee5e8cec527" chipset="bxt" name="ComputeL3Cache" />
+    <guid config_hash="37dc8ae76c2554b11ecea682f1349ece" mdapi_config_hash="16b7f908edc7ee5ddb797c6fb1932fa6" id="ad9d9bc2-ccb7-4f5d-adbb-b4e67e615efd" chipset="bxt" name="HDCAndSF" />
+    <guid config_hash="543b9bdb10f681d516d8d9e2195221cd" mdapi_config_hash="87f92d7860a6674bf05428c26523755b" id="bde7b434-349c-4aad-8596-eb23c0352168" chipset="bxt" name="L3_1" />
+    <guid config_hash="1dc29cbbceb8e2e1a78d679ead80a27b" mdapi_config_hash="c7ec60f268b8efa00960e96dc9491517" id="f3d845e6-bfc3-4ffe-b0e5-dddc80c21f07" chipset="bxt" name="RasterizerAndPixelBackend" />
+    <guid config_hash="0b9e45ed32513193354be363e288b6a6" mdapi_config_hash="ad512c0f8b7457df8edca72ddea75e64" id="a53d620b-c14e-49df-bd27-e076b3fb98f3" chipset="bxt" name="Sampler" />
+    <guid config_hash="3f01b8d28fa285e7a496081574de4c1b" mdapi_config_hash="963e6d32bfe8cee347a8ae14d677c11c" id="8a44b172-6e1d-445f-8937-c06cc487ba39" chipset="bxt" name="TDL_1" />
+    <guid config_hash="0c77cba2d8886c18df9f382ce90eac66" mdapi_config_hash="a66f0092b99ca3a8ce29e0ce4be513ff" id="9d4643f8-aa05-482e-8193-070a8ab0d117" chipset="bxt" name="TDL_2" />
+    <guid config_hash="e6d52ba7af730de63eeaa8d727b36ed7" mdapi_config_hash="6898bc10a62600907cc6c47d1f7004a0" id="c9f5fa3a-d14f-400c-a89a-211206b00ee7" chipset="bxt" name="GpuBusyness" />
+    <guid config_hash="6d13f443205926fd1351ae5adeae8965" mdapi_config_hash="24f384a77963d7d64c324b3d89eeb498" id="d49cd0d8-8c7f-4465-94fc-51e08c9050bc" chipset="bxt" name="PMA_Stall" />
+    <guid config_hash="fc79f102b841df08ac154ddebc634bf6" mdapi_config_hash="3c97b92455702ca6f6a6f846dcc1ebd3" id="07b25942-d9fd-4fce-bd58-e29abd66b7de" chipset="sklgt2" name="RenderBasic" />
+    <guid config_hash="3e0e14aef4a2cf7e61098928c034caff" mdapi_config_hash="ecb641130c942e71d5a9de8adb51c7f6" id="00b80b4c-d215-4378-9015-da3dda3b61ea" chipset="sklgt2" name="ComputeBasic" />
+    <guid config_hash="d757768d43838dd04e2db7e9928c87d9" mdapi_config_hash="79c6baee9374a6c43b8e0fabda2c1a39" id="2a0c0933-37e7-427c-9951-ded42a78bb27" chipset="sklgt2" name="RenderPipeProfile" />
+    <guid config_hash="15938384237d1b01ceb07bc97edd12a9" mdapi_config_hash="22327f250c6079d5d5f9f1a70829dc05" id="246b35f1-44e0-4d03-8936-e452e291d064" chipset="sklgt2" name="MemoryReads" />
+    <guid config_hash="a0c0e0b3ad6e0960c9e3c626e9943c3b" mdapi_config_hash="5dcf9b09ab723e2f4ed17171a2b54a59" id="e0d3da02-00bf-4a96-9795-b48158c73a68" chipset="sklgt2" name="MemoryWrites" />
+    <guid config_hash="31bc9b67c237e4be9469d38ba69ec374" mdapi_config_hash="37e00c6654e34eaab18b6f3b2c606a16" id="c26b1fda-2752-4a33-a448-4c8718366846" chipset="sklgt2" name="ComputeExtended" />
+    <guid config_hash="a142f4714f9189816e129d2bf7ddd060" mdapi_config_hash="cdf98d85d93792dc203d2bfd7ae7559c" id="9fb22842-e708-43f7-9752-e0e41670c39e" chipset="sklgt2" name="ComputeL3Cache" />
+    <guid config_hash="977641d9cac7a2eb62c1c6cc844db2b5" mdapi_config_hash="a70cc632725191096cec1d685119aeb6" id="b4aa5e13-2d25-418f-827d-421f5cc4c43b" chipset="sklgt2" name="HDCAndSF" />
+    <guid config_hash="45aaf271f503f5d5d152b6d97c11412d" mdapi_config_hash="6b111ab20f6929a385eee8d283768ac1" id="504000e8-64f2-4aac-8301-51b81aa60d45" chipset="sklgt2" name="L3_1" />
+    <guid config_hash="6221743043a92819571c49bde5e09582" mdapi_config_hash="0b87bde0336f1d126527c9d8b0e6fa3c" id="f542479b-6685-4670-ad8e-9fe282a2eb5b" chipset="sklgt2" name="L3_2" />
+    <guid config_hash="b6320b7867895a125dec55805a8da286" mdapi_config_hash="7eae454eee816d64ff0fbb991ad4e9b9" id="1cbf1e9f-c2de-4cc2-8d1c-2c33c25a2332" chipset="sklgt2" name="L3_3" />
+    <guid config_hash="35f7405d36fe5767f4c1e80b322243d1" mdapi_config_hash="78b90bbcc0137b2c6e516cb32d44747c" id="b4e54cc8-a3a0-4ccd-9990-65d3184e5a38" chipset="sklgt2" name="RasterizerAndPixelBackend" />
+    <guid config_hash="6e2319f2ca15bfb049b2d1be6d1a0844" mdapi_config_hash="73ceeb4df0d124c61328ecf2c0207503" id="efe7eba4-fd9e-4a09-a92b-334970b5de57" chipset="sklgt2" name="Sampler" />
+    <guid config_hash="90eff0b1f381a2f187bd54f2047ce0f2" mdapi_config_hash="e0913ff09629a32c435487a69f6683b9" id="e9bd0bbb-c7b7-4a26-a27a-246987354776" chipset="sklgt2" name="TDL_1" />
+    <guid config_hash="c41684d2ccbe553874fb9cdbd8fd0229" mdapi_config_hash="6b1a9dc8dd375bf367313ad9b0531580" id="0a7accbf-8c55-455f-9984-23e9fb0b826d" chipset="sklgt2" name="TDL_2" />
+    <guid config_hash="483a06910590c1753a0266ef8b9f9b70" mdapi_config_hash="4be337ed83e3c95aebf66553ed685602" id="41a24047-7484-4ead-ae37-de907e5ff2b2" chipset="sklgt2" name="ComputeExtra" />
+    <guid config_hash="784698b7fb41dad7bc4bf13fac46657b" mdapi_config_hash="2fe32bdaf82fc66774ee95c33a23ea88" id="95910492-943f-44bd-9461-390240f243fd" chipset="sklgt2" name="VMEPipe" />
+    <guid config_hash="d2e36c07c43f128370fe1112d4de1181" mdapi_config_hash="d569893983ce055b9021b64420894431" id="1651949f-0ac0-4cb1-a06f-dafd74a407d1" chipset="sklgt2" name="TestOa" />
+    <guid config_hash="ee7996e47cdaf7722422397285763cdc" mdapi_config_hash="ada812fc71ebbabd1e746dbab67881b1" id="c44a5cf7-886d-477b-bebd-2d738923e4c3" chipset="sklgt2" name="GpuBusyness" />
+    <guid config_hash="cec6202194db96d6a09fed71808bb7de" mdapi_config_hash="df4b9b85ed61f457a0b71b03299b282d" id="e0b2aae4-9b8f-4211-8df0-f8e8cb203209" chipset="sklgt2" name="FfBottlenecks" />
+    <guid config_hash="8ae5bda74271c473f88f13e57d6f6828" mdapi_config_hash="e7f3f72cad542f3a17c09686e65487fc" id="27871149-2fa9-40ba-aa73-350d60c03a09" chipset="sklgt2" name="PMA_Stall" />
+    <guid config_hash="a7f1b241b23898785166ab10ca4ce1bf" mdapi_config_hash="ae3528402606bbb21a08da7ef5ea1530" id="21fef15a-83f4-4ffa-bb81-7da6e38b8e4b" chipset="sklgt3" name="RenderBasic" />
+    <guid config_hash="ede53df6549f788495f7fca90475b6dd" mdapi_config_hash="87390c127ce809c3cfab64388ddebd14" id="4320492b-fd03-42ac-922f-dbe1ef3b7b58" chipset="sklgt3" name="ComputeBasic" />
+    <guid config_hash="0f8eee02ed3e457362ffdc38ed10036c" mdapi_config_hash="2d95f03caa28b40e2a25f3bc8ac38b55" id="bd2d9cae-b9ec-4f5b-9d2f-934bed398a2d" chipset="sklgt3" name="RenderPipeProfile" />
+    <guid config_hash="0a75401250565ee5a0e555b47bc9e5b4" mdapi_config_hash="5218add4f4b16f3db5c92225871eb44c" id="4ca0f3fe-7fd3-4924-98cb-1807d9879767" chipset="sklgt3" name="MemoryReads" />
+    <guid config_hash="2ed5869dae575556e0895b0d0081555c" mdapi_config_hash="adc8e37f86eda900faf1fdb41f5dc3ee" id="a0c0172c-ee13-403d-99ff-2bdf6936cf14" chipset="sklgt3" name="MemoryWrites" />
+    <guid config_hash="6566c55fdf1de8ae73008029a674ecc9" mdapi_config_hash="f3ce984974a95b391e835b3a75aa7813" id="52435e0b-f188-42ea-8680-21a56ee20dee" chipset="sklgt3" name="ComputeExtended" />
+    <guid config_hash="f660e82bbeca0b5d2d31a98dac8eb940" mdapi_config_hash="7b6f81c79c79fb31b0fe5eea542e479f" id="27076eeb-49f3-4fed-8423-c66506005c63" chipset="sklgt3" name="ComputeL3Cache" />
+    <guid config_hash="2c6650c2422869aa2624b26f7a7c51bc" mdapi_config_hash="1ce5fbfd5db4183dfc3ab6bf4badfd59" id="a1b8363b-b986-47b6-929a-847afde3dec8" chipset="sklgt3" name="HDCAndSF" />
+    <guid config_hash="3ead5919c426a00ef6697e21df33ef07" mdapi_config_hash="269534866dc93d83e1e5934bd4900a89" id="fa857069-7f95-44c9-a3e0-cb8ccbc35abb" chipset="sklgt3" name="L3_1" />
+    <guid config_hash="2d0a88cdba58ddf18642fde563edb4d8" mdapi_config_hash="745f63effe3156a5f358999d45bd66c6" id="9830a5f3-a5e2-4773-a49d-6371407c382a" chipset="sklgt3" name="L3_2" />
+    <guid config_hash="d3972886309fa3701f3d3ae185f57cbe" mdapi_config_hash="b46614ab9a28c8a7fe88897cd72437bd" id="59452ceb-24bb-4878-87ec-87aab7b4f9db" chipset="sklgt3" name="L3_3" />
+    <guid config_hash="90ecbd5ae5ae6d3c0f756c7411351c85" mdapi_config_hash="7d797e538b84f6682caacdfb299145d9" id="d2249ff7-34b4-4203-b474-7c11546f9dae" chipset="sklgt3" name="RasterizerAndPixelBackend" />
+    <guid config_hash="5a628cbf246226c19fed41479cf17de1" mdapi_config_hash="1db0203064f7e2f8cb02901fe29a1d33" id="c9cf7c63-0065-4226-941e-98590bad8f75" chipset="sklgt3" name="Sampler" />
+    <guid config_hash="f48609e1a79093073b96726c3c4c63a6" mdapi_config_hash="781425b1a57e4ea0010105f565567161" id="e3bb1501-89ca-43fb-8668-9d96159e10a2" chipset="sklgt3" name="TDL_1" />
+    <guid config_hash="93ab6cf80fefdfca540a3ac101925411" mdapi_config_hash="66d2a4df7b3190be8bd9643e1cb14f99" id="29194a55-7e75-4152-a71f-ef34b1ae4cca" chipset="sklgt3" name="TDL_2" />
+    <guid config_hash="3ca2784da64d161a998b7d8f6d4e0235" mdapi_config_hash="5796dcc1e154e567d7758854bb621bcb" id="2d80a648-7b5a-4e92-bbe7-3b5c76f2e221" chipset="sklgt3" name="ComputeExtra" />
+    <guid config_hash="54b2a9ae72018dd99e63c2ecd9c92901" mdapi_config_hash="6ae821fe8ac78f4b387f9eec605ac900" id="cfae9232-6ffc-42cc-a703-9790016925f0" chipset="sklgt3" name="VMEPipe" />
+    <guid config_hash="cca1580576ffa8e25aa271ebdac68cc7" mdapi_config_hash="d05fe58178a1882edcb81d86070551e3" id="2b985803-d3c9-4629-8a4f-634bfecba0e8" chipset="sklgt3" name="TestOa" />
+    <guid config_hash="6124b939906bc3cda3621544aabfd890" mdapi_config_hash="24ef7b4026d1ac159bb663946df0e9b0" id="0c5058ff-fdf4-4e0d-81fb-c0310fb76525" chipset="sklgt3" name="GpuBusyness" />
+    <guid config_hash="8ae5bda74271c473f88f13e57d6f6828" mdapi_config_hash="4d9fb617c64406cc8b372808461dd3e3" id="c889fd93-8dc7-4ba5-9451-de34a8b5ea3f" chipset="sklgt3" name="PMA_Stall" />
+    <guid config_hash="0a80b2a2caa3386ecce110a7904eb1c1" mdapi_config_hash="61d002ce457b9ce087613d986e6b0544" id="95322a71-bb05-4437-bc27-f7dd7b27d136" chipset="sklgt4" name="RenderBasic" />
+    <guid config_hash="898ee42bb4b359d4c0eb97c5919cfd7f" mdapi_config_hash="d596d8f326e5378b871b825eb954e95c" id="7277228f-e7f3-4743-945a-6a2049d11377" chipset="sklgt4" name="ComputeBasic" />
+    <guid config_hash="48b5556f95fc27dceb10c65556a16613" mdapi_config_hash="95e3f2b556fe9795e0d0e0d3b0c5ee00" id="463c668c-3f60-49b6-8f85-d995b635b3b2" chipset="sklgt4" name="RenderPipeProfile" />
+    <guid config_hash="0a75401250565ee5a0e555b47bc9e5b4" mdapi_config_hash="d39a578cdf930d109c992f4abd7f83cb" id="3ae6e74c-72c3-4040-9bd0-7961430b8cc8" chipset="sklgt4" name="MemoryReads" />
+    <guid config_hash="2ed5869dae575556e0895b0d0081555c" mdapi_config_hash="603b987097b9d84c53eb55c60272b286" id="055f256d-4052-467c-8dec-6064a4806433" chipset="sklgt4" name="MemoryWrites" />
+    <guid config_hash="6566c55fdf1de8ae73008029a674ecc9" mdapi_config_hash="26c920eddaf1b7e2d58c37a96d4076bd" id="753972d4-87cd-4460-824d-754463ac5054" chipset="sklgt4" name="ComputeExtended" />
+    <guid config_hash="96d8e8d820ebad84b71c222f3c448ec5" mdapi_config_hash="182cd4a00f7a24a0c844bf9f8435419e" id="4e4392e9-8f73-457b-ab44-b49f7a0c733b" chipset="sklgt4" name="ComputeL3Cache" />
+    <guid config_hash="25ad6a99a2b00414d4747035af7fac94" mdapi_config_hash="f69a28470a231f8d0c20e3173274cf88" id="75f56991-b149-4122-ade9-d9c0c80c733b" chipset="sklgt4" name="HDCAndSF" />
+    <guid config_hash="3ead5919c426a00ef6697e21df33ef07" mdapi_config_hash="52b2279e32293bfe3cf97e443940215a" id="0d4cda70-da83-466f-b61e-7a064fe6a232" chipset="sklgt4" name="L3_1" />
+    <guid config_hash="2d0a88cdba58ddf18642fde563edb4d8" mdapi_config_hash="1541624f29b55f8abf422eaa813657e7" id="20137ace-b110-4341-883f-1094c820093c" chipset="sklgt4" name="L3_2" />
+    <guid config_hash="d3972886309fa3701f3d3ae185f57cbe" mdapi_config_hash="c734154b7a9bd205b8bfb176211873c3" id="d3a6b05e-46ef-44a8-96c3-9bd3e58acbe6" chipset="sklgt4" name="L3_3" />
+    <guid config_hash="90ecbd5ae5ae6d3c0f756c7411351c85" mdapi_config_hash="0fbb2b2f53429b0a25a6628c1fb21b32" id="4081b948-63f1-4b1a-abaa-6017cb77a63b" chipset="sklgt4" name="RasterizerAndPixelBackend" />
+    <guid config_hash="5a628cbf246226c19fed41479cf17de1" mdapi_config_hash="032dea8a40f7c0bbe2c9e0a238df248d" id="eae6bbb1-0e2b-478d-bd9e-f10ded2178f9" chipset="sklgt4" name="Sampler" />
+    <guid config_hash="f48609e1a79093073b96726c3c4c63a6" mdapi_config_hash="39a8e4da917b0874b8e697f203a641ff" id="1bba4bd2-81d4-45ec-847f-bc363e17e14d" chipset="sklgt4" name="TDL_1" />
+    <guid config_hash="93ab6cf80fefdfca540a3ac101925411" mdapi_config_hash="60b1253d54ce38bb6678d9a3eaa10305" id="a4b3106c-cfec-49f5-8e26-470470379e66" chipset="sklgt4" name="TDL_2" />
+    <guid config_hash="19cb1c38ee83566f630015215532efa5" mdapi_config_hash="f9ae90355e5abe786bf5e81f1c4222c0" id="a5aa857d-e8f0-4dfa-8981-ce340fa748fd" chipset="sklgt4" name="ComputeExtra" />
+    <guid config_hash="b28f9fef3bf5699c217d634bffa57fbc" mdapi_config_hash="cafc4d5abc6807434093d4f47fe83292" id="0e8d8b86-4ee7-4cdd-aaaa-58adc92cb29e" chipset="sklgt4" name="VMEPipe" />
+    <guid config_hash="cca1580576ffa8e25aa271ebdac68cc7" mdapi_config_hash="051007cbfaffa4151d7c9365edde7bff" id="882fa433-1f4a-4a67-a962-c741888fe5f5" chipset="sklgt4" name="TestOa" />
+    <guid config_hash="6124b939906bc3cda3621544aabfd890" mdapi_config_hash="24ef7b4026d1ac159bb663946df0e9b0" id="4e5b1599-5b01-4b3d-89fa-6b26a25fe02b" chipset="sklgt4" name="GpuBusyness" />
+    <guid config_hash="8ae5bda74271c473f88f13e57d6f6828" mdapi_config_hash="4d9fb617c64406cc8b372808461dd3e3" id="befe9fd6-474e-4a3d-b98e-cd793715cf91" chipset="sklgt4" name="PMA_Stall" />
+    <guid config_hash="afbe2cb999a8303f52eea075f3b8687e" mdapi_config_hash="966416aaaf33b0bce90c0daa51217242" id="99c1a40e-a090-4354-86e3-4d068bb1917e" chipset="kblgt2" name="RenderBasic" />
+    <guid config_hash="e337295245fb93eccf7b096f2728ca98" mdapi_config_hash="86040ee918c1b39c616b777101369f16" id="e17fc42a-e614-41b6-90c4-1074841a6c77" chipset="kblgt2" name="ComputeBasic" />
+    <guid config_hash="01f86f590b9b0c0371b0075a5e73b902" mdapi_config_hash="7ee27e7f11eea3282e62abde604b61a2" id="d7a17a3a-ca71-40d2-a919-ace80d50633f" chipset="kblgt2" name="RenderPipeProfile" />
+    <guid config_hash="0a75401250565ee5a0e555b47bc9e5b4" mdapi_config_hash="0779bba85f8be3baef98ecc5c66fd369" id="57b59202-172b-477a-87de-33f85572c589" chipset="kblgt2" name="MemoryReads" />
+    <guid config_hash="2ed5869dae575556e0895b0d0081555c" mdapi_config_hash="26eb749438ad7d42e34342048c1019c5" id="3addf8ef-8e9b-40f5-a448-3dbb5d5128b0" chipset="kblgt2" name="MemoryWrites" />
+    <guid config_hash="6566c55fdf1de8ae73008029a674ecc9" mdapi_config_hash="aa2dd4e7d446e3ce29dfeaf8f393243e" id="4af0400a-81c3-47db-a6b6-deddbd75680e" chipset="kblgt2" name="ComputeExtended" />
+    <guid config_hash="33bdd2160049aa831e025e1be7a453c5" mdapi_config_hash="2770df840fca647230d55b79f686ae11" id="0e22f995-79ca-4f67-83ab-e9d9772488d8" chipset="kblgt2" name="ComputeL3Cache" />
+    <guid config_hash="5736948ed298fd6e8cc80222e1e03077" mdapi_config_hash="c056251351b0b1f5beb4f6863484854b" id="fb149d66-fad2-4230-b0d7-4d689b9116d3" chipset="kblgt2" name="HDCAndSF" />
+    <guid config_hash="3ead5919c426a00ef6697e21df33ef07" mdapi_config_hash="17d38bff109de8e5622ff29bead0bbcf" id="f889f8cc-4c93-4ac8-b75f-551c0b9b87f7" chipset="kblgt2" name="L3_1" />
+    <guid config_hash="2d0a88cdba58ddf18642fde563edb4d8" mdapi_config_hash="1a88f6816aea2c42dae9f10d4233cb74" id="6d344efd-8e9e-42d4-a29e-1011c29f82c2" chipset="kblgt2" name="L3_2" />
+    <guid config_hash="d3972886309fa3701f3d3ae185f57cbe" mdapi_config_hash="ae28a594b1a6fd3864272da8dbe873f5" id="e3b386ae-c195-47d5-af29-8a1afa0ae2bf" chipset="kblgt2" name="L3_3" />
+    <guid config_hash="90ecbd5ae5ae6d3c0f756c7411351c85" mdapi_config_hash="d1b2421e43a489ffcdfeeaf271b2f12f" id="f9954679-a055-4862-9f57-9d66e3ebf81c" chipset="kblgt2" name="RasterizerAndPixelBackend" />
+    <guid config_hash="5a628cbf246226c19fed41479cf17de1" mdapi_config_hash="8d5f977be4f4d21e97e9e67786958495" id="4ed5e27e-fd1a-4f11-ad8f-9374e128c697" chipset="kblgt2" name="Sampler" />
+    <guid config_hash="f48609e1a79093073b96726c3c4c63a6" mdapi_config_hash="cbef2ea0f1c6e30bd37cea22a87e8373" id="9eaf384d-8f53-41b8-a71d-108308780fbc" chipset="kblgt2" name="TDL_1" />
+    <guid config_hash="93ab6cf80fefdfca540a3ac101925411" mdapi_config_hash="b685ab8fe6fc020e85f189f55fdf6e05" id="a00cbdf2-eabd-4240-9a89-86e2ac1ca1e4" chipset="kblgt2" name="TDL_2" />
+    <guid config_hash="483a06910590c1753a0266ef8b9f9b70" mdapi_config_hash="4be337ed83e3c95aebf66553ed685602" id="aa7a3fb9-22fb-43ff-a32d-0ab6c13bbd16" chipset="kblgt2" name="ComputeExtra" />
+    <guid config_hash="784698b7fb41dad7bc4bf13fac46657b" mdapi_config_hash="2fe32bdaf82fc66774ee95c33a23ea88" id="398a4268-ef6f-4ffc-b55f-3c7b5363ce61" chipset="kblgt2" name="VMEPipe" />
+    <guid config_hash="cca1580576ffa8e25aa271ebdac68cc7" mdapi_config_hash="5f4afc2f159098e96b8fd90a85979ae3" id="baa3c7e4-52b6-4b85-801e-465a94b746dd" chipset="kblgt2" name="TestOa" />
+    <guid config_hash="d36b63d76294172be0ad5e6530109d06" mdapi_config_hash="aa4c1ab961a066b0bc98bf914735b6af" id="6c66fe6e-2988-454a-bfae-7fca3bbcbec2" chipset="kblgt2" name="GpuBusyness" />
+    <guid config_hash="8ae5bda74271c473f88f13e57d6f6828" mdapi_config_hash="4d9fb617c64406cc8b372808461dd3e3" id="b49aa434-4958-4d98-9e6f-443ff27ca74d" chipset="kblgt2" name="PMA_Stall" />
+    <guid config_hash="73805d7acd1298aa6d81d3e2278ee411" mdapi_config_hash="9111e46468492c1c14a331510c18a49b" id="17b4f3e0-d578-4ae3-b7a8-98d756d1e0df" chipset="kblgt3" name="RenderBasic" />
+    <guid config_hash="e337295245fb93eccf7b096f2728ca98" mdapi_config_hash="f56077c263fafefe554173ce024b2827" id="9823aaa1-b06f-40ce-884b-cd798c79f0c2" chipset="kblgt3" name="ComputeBasic" />
+    <guid config_hash="01f86f590b9b0c0371b0075a5e73b902" mdapi_config_hash="808e46d786103380f58d1e8f91402c4c" id="c7c735f3-ce58-45cf-aa04-30b183f1faff" chipset="kblgt3" name="RenderPipeProfile" />
+    <guid config_hash="0a75401250565ee5a0e555b47bc9e5b4" mdapi_config_hash="f810d7343822b3a3b9e50820708bfcb3" id="96ec2219-040b-428a-856a-6bc03363a057" chipset="kblgt3" name="MemoryReads" />
+    <guid config_hash="2ed5869dae575556e0895b0d0081555c" mdapi_config_hash="af6cd36da93a8ec66d57ba6b504b601f" id="03372b64-4996-4d3b-aa18-790e75eeb9c2" chipset="kblgt3" name="MemoryWrites" />
+    <guid config_hash="6566c55fdf1de8ae73008029a674ecc9" mdapi_config_hash="c4d070800ff5b65caff35d40adb52d04" id="31b4ce5a-bd61-4c1f-bb5d-f2e731412150" chipset="kblgt3" name="ComputeExtended" />
+    <guid config_hash="33bdd2160049aa831e025e1be7a453c5" mdapi_config_hash="dcedeef0d1a6b20eaa3f3ee546b048ed" id="2ce0911a-27fc-4887-96f0-11084fa807c3" chipset="kblgt3" name="ComputeL3Cache" />
+    <guid config_hash="c8739d6465605b9228ec2ff3ebde2ba3" mdapi_config_hash="3a893043b806be4b00179663f8f4695e" id="b128f45f-bfa2-4991-aadc-05be7898e398" chipset="kblgt3" name="HDCAndSF" />
+    <guid config_hash="3ead5919c426a00ef6697e21df33ef07" mdapi_config_hash="b97b4654b688f69b1df22e7d9cd08f2b" id="f3566b55-9c13-47bf-8327-4a887af75262" chipset="kblgt3" name="L3_1" />
+    <guid config_hash="2d0a88cdba58ddf18642fde563edb4d8" mdapi_config_hash="f8870bc48196bdc7c3d08bf0dba3e377" id="7b21aa68-9076-4ab4-8a84-e45a06c8eac6" chipset="kblgt3" name="L3_2" />
+    <guid config_hash="d3972886309fa3701f3d3ae185f57cbe" mdapi_config_hash="2091a23cf2f835375430e16328f73c7b" id="71b4b9dd-ae28-48ce-9a1a-5431e1f23afd" chipset="kblgt3" name="L3_3" />
+    <guid config_hash="90ecbd5ae5ae6d3c0f756c7411351c85" mdapi_config_hash="6c748481e5e43019bbeb0557c309b65e" id="52c646ca-52da-4853-877e-8645e73ed330" chipset="kblgt3" name="RasterizerAndPixelBackend" />
+    <guid config_hash="5a628cbf246226c19fed41479cf17de1" mdapi_config_hash="c1ea12cf95f7c8be3ca32c6670c15a27" id="c4bb682f-677c-4875-990b-005230be87b4" chipset="kblgt3" name="Sampler" />
+    <guid config_hash="f48609e1a79093073b96726c3c4c63a6" mdapi_config_hash="20f9812e7c1c94a2b24dbb6a0596b5e1" id="ade8521b-5e72-45d4-8c25-d9f0da774899" chipset="kblgt3" name="TDL_1" />
+    <guid config_hash="93ab6cf80fefdfca540a3ac101925411" mdapi_config_hash="25e39a0a38a1fdbf4e2ff677aad30fc6" id="9df2815d-4e9e-417f-bde1-3788dc6e1ea1" chipset="kblgt3" name="TDL_2" />
+    <guid config_hash="f543908db2541ef48f35603e35c379bd" mdapi_config_hash="41ebe4b58e504d63d60141faa9d45c18" id="efc497ac-884e-4ee4-a4a8-15fba22aaf21" chipset="kblgt3" name="ComputeExtra" />
+    <guid config_hash="16c6718fd82aaa5e1187df8d88ace152" mdapi_config_hash="d0ce6de1ad831394a048015990e82864" id="bfd9764d-2c5b-4c16-bfc1-89de3ca10917" chipset="kblgt3" name="VMEPipe" />
+    <guid config_hash="cca1580576ffa8e25aa271ebdac68cc7" mdapi_config_hash="817cb7526b5399e772ed721e062325b3" id="f1792f32-6db2-4b50-b4b2-557128f1688d" chipset="kblgt3" name="TestOa" />
+    <guid config_hash="de8530fdc36d260415e78771e8cc6929" mdapi_config_hash="3f82064fe17d6d7005b6e5c4bb828c5a" id="b55ecba1-2aa9-422e-89ff-b9e30f03d447" chipset="kblgt3" name="GpuBusyness" />
+    <guid config_hash="8ae5bda74271c473f88f13e57d6f6828" mdapi_config_hash="4d9fb617c64406cc8b372808461dd3e3" id="85bc2e4f-2563-4388-921b-dc0dad879cf3" chipset="kblgt3" name="PMA_Stall" />
+    <guid config_hash="c01efa1ec2a11ea9aaab8b0a8e548174" mdapi_config_hash="7867725687bd177e4e8b8b8443b04355" id="d72df5c7-5b4a-4274-a43f-00b0fd51fc68" chipset="glk" name="RenderBasic" />
+    <guid config_hash="cde046a01aba9c56d6fa44bf2c0f26c2" mdapi_config_hash="84d270fda538f1061067316b19b9cac9" id="814285f6-354d-41d2-ba49-e24e622714a0" chipset="glk" name="ComputeBasic" />
+    <guid config_hash="1669463a6836f6d057cbf3e41506923b" mdapi_config_hash="66b8f785edc91d1cf3952fc842114671" id="07d397a6-b3e6-49f6-9433-a4f293d55978" chipset="glk" name="RenderPipeProfile" />
+    <guid config_hash="f9eee3f0c9653ffd05e4876be0ea44d5" mdapi_config_hash="1056f30306a4c2d08d57e4faa86f983a" id="1a356946-5428-450b-a2f0-89f8783a302d" chipset="glk" name="MemoryReads" />
+    <guid config_hash="03e840f1d8597b3c6c4015792243ce7d" mdapi_config_hash="3a432ab2a6296f25755c1846385fae55" id="5299be9d-7a61-4c99-9f81-f87e6c5aaca9" chipset="glk" name="MemoryWrites" />
+    <guid config_hash="39a03c065f1fdb5bf680207dc520cdb2" mdapi_config_hash="ed01dd3479766a5fb38dd8e9e064786e" id="bc9bcff2-459a-4cbc-986d-a84b077153f3" chipset="glk" name="ComputeExtended" />
+    <guid config_hash="c241c2999f487dc995cecdb35b01197b" mdapi_config_hash="3a74134eedb02e201197da17e0940351" id="88ec931f-5b4a-453a-9db6-a61232b6143d" chipset="glk" name="ComputeL3Cache" />
+    <guid config_hash="37dc8ae76c2554b11ecea682f1349ece" mdapi_config_hash="fd61133e8762cb61d142a12604442177" id="0329ea02-ebb8-43f1-bf89-c5bdcccd3eb4" chipset="glk" name="HDCAndSF" />
+    <guid config_hash="d159b7f14e97660ae2887e4b610d2721" mdapi_config_hash="fe48f1232b010e9d10ab1bff0e6efb75" id="5e57a25a-1d18-4e94-b84b-08ea66751b8c" chipset="glk" name="L3_1" />
+    <guid config_hash="1dc29cbbceb8e2e1a78d679ead80a27b" mdapi_config_hash="2a635538209cc68b2c489d2326017539" id="f0652373-d361-426f-b36d-9ffec288bdc6" chipset="glk" name="RasterizerAndPixelBackend" />
+    <guid config_hash="0b9e45ed32513193354be363e288b6a6" mdapi_config_hash="593e37453b96243ac7752d9c45672c63" id="6ac97d12-ce13-428a-b20c-6902bde2608b" chipset="glk" name="Sampler" />
+    <guid config_hash="3f01b8d28fa285e7a496081574de4c1b" mdapi_config_hash="af87c7792e604a645dacdadb99c4afd2" id="59ea703a-9a35-4aed-a985-0d9ab7aceaba" chipset="glk" name="TDL_1" />
+    <guid config_hash="0c77cba2d8886c18df9f382ce90eac66" mdapi_config_hash="2e2beadb54378ff4d79bf4cf15bffd90" id="f2d6d718-e7b1-48f4-9624-45230d2fe2a0" chipset="glk" name="TDL_2" />
+    <guid config_hash="a19a55aad269ccc1ed4380314eda4bed" mdapi_config_hash="ac34c2028f3f4fae92e58aae1496901b" id="15274c82-27d2-4819-876a-7cb1a2c59ba4" chipset="glk" name="ComputeExtra" />
+    <guid config_hash="e018d083414e4d28e0ed481554128883" mdapi_config_hash="dce59e977ffff25a57f2486f5d9a7c60" id="dd3fd789-e783-4204-8cd0-b671bbccb0cf" chipset="glk" name="TestOa" />
+    <guid config_hash="6d13f443205926fd1351ae5adeae8965" mdapi_config_hash="24f384a77963d7d64c324b3d89eeb498" id="e6868953-fb47-431d-a060-f785916558fc" chipset="glk" name="PMA_Stall" />
+    <guid config_hash="afbe2cb999a8303f52eea075f3b8687e" mdapi_config_hash="8e8f1f5eb1b0a95dada8e3ddd78f4dd8" id="7fa796a4-0c7a-4201-afc6-cff0b2f528a2" chipset="cflgt2" name="RenderBasic" />
+    <guid config_hash="e337295245fb93eccf7b096f2728ca98" mdapi_config_hash="9d5a7e8dd6290726416c3b40bba653ff" id="dc8cf7ea-26b4-4478-ac93-dab174f92ac0" chipset="cflgt2" name="ComputeBasic" />
+    <guid config_hash="01f86f590b9b0c0371b0075a5e73b902" mdapi_config_hash="f9a35b936db9a2f76b69d7b5bd5d10ec" id="2221e4d5-ed7b-445e-b2cc-3de1b97f4d42" chipset="cflgt2" name="RenderPipeProfile" />
+    <guid config_hash="0a75401250565ee5a0e555b47bc9e5b4" mdapi_config_hash="8b1e5617e61646d7d7d0361107ec2b67" id="82096a90-e2fa-4f38-ac14-562b2496933a" chipset="cflgt2" name="MemoryReads" />
+    <guid config_hash="2ed5869dae575556e0895b0d0081555c" mdapi_config_hash="2cd637a11aacc15af119c9dba70c5f1d" id="9f638880-02e9-4a8d-896a-7670a3bf0d35" chipset="cflgt2" name="MemoryWrites" />
+    <guid config_hash="6566c55fdf1de8ae73008029a674ecc9" mdapi_config_hash="5311aa266d0d85e7b67695731408ec3e" id="8d4ad934-7c16-43d5-845a-51067a4c8e2f" chipset="cflgt2" name="ComputeExtended" />
+    <guid config_hash="33bdd2160049aa831e025e1be7a453c5" mdapi_config_hash="019cd29f8fe235d7dca74e7860dafc08" id="4389cf07-1424-4963-b2d2-64fcec75406d" chipset="cflgt2" name="ComputeL3Cache" />
+    <guid config_hash="5736948ed298fd6e8cc80222e1e03077" mdapi_config_hash="4118768c8cfd35668067034b646a99ea" id="ac544b3a-ff78-46ea-9808-ee6fef0978b4" chipset="cflgt2" name="HDCAndSF" />
+    <guid config_hash="3ead5919c426a00ef6697e21df33ef07" mdapi_config_hash="fe8bb34c7f8bb873a55e7b7046ec4507" id="a35c5867-0ab8-4d45-8fc1-eb0906f0eff5" chipset="cflgt2" name="L3_1" />
+    <guid config_hash="2d0a88cdba58ddf18642fde563edb4d8" mdapi_config_hash="d4b1fe90832f2ab808b5dc6d6f2de431" id="bb4bcce9-2cbb-4818-9e49-67ce2c99cd25" chipset="cflgt2" name="L3_2" />
+    <guid config_hash="d3972886309fa3701f3d3ae185f57cbe" mdapi_config_hash="0a733ec395a9f95c9a4c7a53639352aa" id="9e1229f8-d87f-4f44-b067-3544e17195aa" chipset="cflgt2" name="L3_3" />
+    <guid config_hash="90ecbd5ae5ae6d3c0f756c7411351c85" mdapi_config_hash="86e99a03089772a7bff973a24bbcb21f" id="3e91908a-1c70-4004-b2ab-a10ef14f24f9" chipset="cflgt2" name="RasterizerAndPixelBackend" />
+    <guid config_hash="5a628cbf246226c19fed41479cf17de1" mdapi_config_hash="07cab9aa8c9c07b346ce2e8976ef87fa" id="9a6ba957-7955-4a09-a8ce-083030ba3c1f" chipset="cflgt2" name="Sampler" />
+    <guid config_hash="f48609e1a79093073b96726c3c4c63a6" mdapi_config_hash="8e2985ac9a60942987f94a397bfeb2ff" id="c54e7ca3-c60c-4396-ac3d-f9899c9a6ee4" chipset="cflgt2" name="TDL_1" />
+    <guid config_hash="93ab6cf80fefdfca540a3ac101925411" mdapi_config_hash="775f1d07ed4d225976adf356e8dc9df5" id="e438cd5d-1da7-46c6-9823-4780f370d11d" chipset="cflgt2" name="TDL_2" />
+    <guid config_hash="483a06910590c1753a0266ef8b9f9b70" mdapi_config_hash="4be337ed83e3c95aebf66553ed685602" id="5f679fb0-909e-4c0e-b4b2-8e801f83e71b" chipset="cflgt2" name="ComputeExtra" />
+    <guid config_hash="784698b7fb41dad7bc4bf13fac46657b" mdapi_config_hash="2fe32bdaf82fc66774ee95c33a23ea88" id="0d09ba9a-1d1c-457d-83e2-74ac448014d6" chipset="cflgt2" name="VMEPipe" />
+    <guid config_hash="d36b63d76294172be0ad5e6530109d06" mdapi_config_hash="aa4c1ab961a066b0bc98bf914735b6af" id="e2f162ae-5732-4af0-8b11-69510f57094a" chipset="cflgt2" name="GpuBusyness" />
+    <guid config_hash="cca1580576ffa8e25aa271ebdac68cc7" mdapi_config_hash="5f4afc2f159098e96b8fd90a85979ae3" id="74fb4902-d3d3-4237-9e90-cbdc68d0a446" chipset="cflgt2" name="TestOa" />
+    <guid config_hash="8ae5bda74271c473f88f13e57d6f6828" mdapi_config_hash="4d9fb617c64406cc8b372808461dd3e3" id="5ccbf9fb-6bf2-456b-a749-bdff7b1aff13" chipset="cflgt2" name="PMA_Stall" />
+    <guid config_hash="73805d7acd1298aa6d81d3e2278ee411" mdapi_config_hash="5d3d4bcf1e36569409cfd84a7e137ade" id="b316bcab-212f-4228-97de-af6b5a1a2ea1" chipset="cflgt3" name="RenderBasic" />
+    <guid config_hash="e337295245fb93eccf7b096f2728ca98" mdapi_config_hash="0860a8d90a0aa24c5e766b1062dc9af6" id="607f9cc8-e026-4d5f-bfad-45c77eabc150" chipset="cflgt3" name="ComputeBasic" />
+    <guid config_hash="01f86f590b9b0c0371b0075a5e73b902" mdapi_config_hash="498feca145a69e7fcec55b79d239d005" id="9875e050-b1bc-45e6-a6ab-665594601df9" chipset="cflgt3" name="RenderPipeProfile" />
+    <guid config_hash="0a75401250565ee5a0e555b47bc9e5b4" mdapi_config_hash="610a6fcb593c50362beb8c0e2172685a" id="49c65f34-e625-4ca4-86b7-88693e624d4c" chipset="cflgt3" name="MemoryReads" />
+    <guid config_hash="2ed5869dae575556e0895b0d0081555c" mdapi_config_hash="d3b21fcad90e080ef31d74b9ebd6f9ba" id="45c9e8ee-2998-4d83-88e8-9cb7e03287bf" chipset="cflgt3" name="MemoryWrites" />
+    <guid config_hash="6566c55fdf1de8ae73008029a674ecc9" mdapi_config_hash="7c26cd39edceac6865beb355592d2bea" id="bac415ce-d7a2-4f8d-9b16-834deba7330e" chipset="cflgt3" name="ComputeExtended" />
+    <guid config_hash="33bdd2160049aa831e025e1be7a453c5" mdapi_config_hash="1013698045cad3a9935f5cd76ceb8331" id="a8cfca44-0e74-4338-9e57-3daad98957dd" chipset="cflgt3" name="ComputeL3Cache" />
+    <guid config_hash="c8739d6465605b9228ec2ff3ebde2ba3" mdapi_config_hash="6c4d2ca081899cddb7c730b7c9e11b35" id="c4bee67c-0de6-4bc2-9900-5388dcc8adca" chipset="cflgt3" name="HDCAndSF" />
+    <guid config_hash="3ead5919c426a00ef6697e21df33ef07" mdapi_config_hash="74d87a1c8c2eb43fc0d481a88e635cc4" id="2f77a650-54a6-4777-98dc-e49000c13ceb" chipset="cflgt3" name="L3_1" />
+    <guid config_hash="2d0a88cdba58ddf18642fde563edb4d8" mdapi_config_hash="e2ccd67d442ca19acc63a9b3556ce2cb" id="61cf6b31-9ddd-4deb-bae5-7339dd1f63b3" chipset="cflgt3" name="L3_2" />
+    <guid config_hash="d3972886309fa3701f3d3ae185f57cbe" mdapi_config_hash="fda9efbaddee05cf0c58b0b5ba63267a" id="1421ea8b-a4c9-4383-922a-60ba96c42f24" chipset="cflgt3" name="L3_3" />
+    <guid config_hash="90ecbd5ae5ae6d3c0f756c7411351c85" mdapi_config_hash="04d6c2564113599d8375138bcf87e0a5" id="6e1f0a90-c65f-4da9-86d0-c79b3c0063f6" chipset="cflgt3" name="RasterizerAndPixelBackend" />
+    <guid config_hash="5a628cbf246226c19fed41479cf17de1" mdapi_config_hash="9aa750e153f190ac1aeb54a87f778c8f" id="7cb05eab-0857-4189-93bc-09326d298637" chipset="cflgt3" name="Sampler" />
+    <guid config_hash="f48609e1a79093073b96726c3c4c63a6" mdapi_config_hash="88333263dd73a05cb7df643794d2eefa" id="05a06d02-0c12-486b-bb1d-9be053848980" chipset="cflgt3" name="TDL_1" />
+    <guid config_hash="93ab6cf80fefdfca540a3ac101925411" mdapi_config_hash="6750a43049c53c8cb8f966764bf7cf8f" id="cddbd1dc-41a2-4fe4-8b05-3d2773120814" chipset="cflgt3" name="TDL_2" />
+    <guid config_hash="f543908db2541ef48f35603e35c379bd" mdapi_config_hash="e3197d98aa86acaf090f1bffde854586" id="e61ae394-9d9e-4204-a735-1dad7e44d953" chipset="cflgt3" name="ComputeExtra" />
+    <guid config_hash="16c6718fd82aaa5e1187df8d88ace152" mdapi_config_hash="d0ce6de1ad831394a048015990e82864" id="94272ad9-45ee-4e34-b7a7-51546cd6405c" chipset="cflgt3" name="VMEPipe" />
+    <guid config_hash="de8530fdc36d260415e78771e8cc6929" mdapi_config_hash="3f82064fe17d6d7005b6e5c4bb828c5a" id="22b7e0c2-cade-425f-b099-34479768c72a" chipset="cflgt3" name="GpuBusyness" />
+    <guid config_hash="cca1580576ffa8e25aa271ebdac68cc7" mdapi_config_hash="228710e94277d74bd4be0c2536a3edd4" id="577e8e2c-3fa0-4875-8743-3538d585e3b0" chipset="cflgt3" name="TestOa" />
+    <guid config_hash="8ae5bda74271c473f88f13e57d6f6828" mdapi_config_hash="4d9fb617c64406cc8b372808461dd3e3" id="c11af8d1-858b-4f8b-98fb-8d683ba8bda0" chipset="cflgt3" name="PMA_Stall" />
+    <guid config_hash="428ad0859c9dac4ba85dd73106f5b2de" mdapi_config_hash="7baf473e87d0838b628bd2ed289f4783" id="2d975e19-7130-41d2-b06f-79d74f91e7c8" chipset="cnl" name="RenderBasic" />
+    <guid config_hash="7365cff2873ed22304dcb350ca19d834" mdapi_config_hash="174f9ff2125d06a7886a258304ba4eae" id="eed14f91-5f03-4e3a-8281-ac38030ac573" chipset="cnl" name="ComputeBasic" />
+    <guid config_hash="1878c620a9f0cc5100fba47c83a1457c" mdapi_config_hash="f1baa55e099488db74fd02c9560df40b" id="0666ccac-f5aa-4dc2-aa12-c6e058f383f3" chipset="cnl" name="RenderPipeProfile" />
+    <guid config_hash="10d83436d03f71bc19e6b83739072556" mdapi_config_hash="7f0796f55071a69b76c0a0615b2171e6" id="3500dcfd-837b-4ec8-b5cf-fe58b966263f" chipset="cnl" name="MemoryReads" />
+    <guid config_hash="e1c4bd09bd777f97d6c6491bf921ec6b" mdapi_config_hash="92754b4c69ef3427efdee08033daf7e2" id="63d18ead-3cfc-4972-a640-5e98b688dfee" chipset="cnl" name="MemoryWrites" />
+    <guid config_hash="01c5575fa201196b2a4b708001ef810f" mdapi_config_hash="f7fc9c2349a53c37bd020660a0990356" id="1b4d1280-6bbd-4d57-90c6-a03ed6059688" chipset="cnl" name="ComputeExtended" />
+    <guid config_hash="21c0efc6587cd42844e23251b3712b72" mdapi_config_hash="c3d136f1cda81821d08595bc4c29973a" id="f3b31b5a-00b3-4fb4-81fd-6446e505534c" chipset="cnl" name="ComputeL3Cache" />
+    <guid config_hash="0813a24fac91efc4f1dfb7dbb578f08d" mdapi_config_hash="417896f2fec55d50f844eb2344287731" id="890094c5-8615-4f69-a8b9-706c5bcbd713" chipset="cnl" name="HDCAndSF" />
+    <guid config_hash="fb9e04dafcf3519c30c215cb2094a881" mdapi_config_hash="65bd9bbb664fd329464d18e07dd9ac47" id="e56f7dd7-ff55-4bae-89a1-a526a2e3b0d6" chipset="cnl" name="L3_1" />
+    <guid config_hash="28ade5f07e44ef07814f7a307a06470c" mdapi_config_hash="24f525009f45d22253ff7c09951733c9" id="918834e2-a1a4-4d77-9f3a-0c229f8d803f" chipset="cnl" name="L3_2" />
+    <guid config_hash="7f9fb1f70df8efb8cbd236ee8920c349" mdapi_config_hash="20e9d5975e60292c3aaecfc766d2d960" id="2e95713a-c6d8-47a9-9207-eba3e208be51" chipset="cnl" name="RasterizerAndPixelBackend" />
+    <guid config_hash="c6bda99f4d7656d8b1b613c17c2d53da" mdapi_config_hash="2c48df889c497b3f97d5a350827d8f05" id="9bcf4ff2-c15f-4bea-8ec8-8db87791942e" chipset="cnl" name="Sampler" />
+    <guid config_hash="4bfffb81b9376af931bad919fc66ef3f" mdapi_config_hash="33d7ba5d98519f3038ed07f273fe5f91" id="c46c7bb5-f26d-4634-b491-902394af85b1" chipset="cnl" name="TDL_1" />
+    <guid config_hash="e5419b6c232500a6a824c2c58f3b7d32" mdapi_config_hash="b9a01044b9befe9fcf952f26ba4fcc4e" id="aa2d6ab4-99b3-42f8-94d6-4a9aa2baedaf" chipset="cnl" name="TDL_2" />
+    <guid config_hash="ccb9fdae1fe1f44c4c32bdc69befc160" mdapi_config_hash="9cf34989f5e721e734d4edf26036c2c5" id="db41edd4-d8e7-4730-ad11-b9a2d6833503" chipset="cnl" name="TestOa" />
+    <guid config_hash="eaaf4df3ac5e9b4fd52d980f0be72dbf" mdapi_config_hash="8ef6088f425f2a97b01bed560ad6e2b3" id="193093b2-da24-49bf-b407-442c213b71b4" chipset="icl" name="RenderBasic" />
+    <guid config_hash="6b23eee815d02e770dc7e79d2246124f" mdapi_config_hash="460d90c501e2a66273fd830b7a01812d" id="233a477b-f8f0-40f4-bf57-01440c3701d9" chipset="icl" name="ComputeBasic" />
+    <guid config_hash="3b6635eb3709f346076901ea88ec1f2b" mdapi_config_hash="402f156b276dfaaaf84eb09ec5347515" id="43eb7fc1-dc5e-45e2-a90a-0053f5397271" chipset="icl" name="ComputeExtended" />
+    <guid config_hash="82f99a59ec47e807d35dde01c4013d02" mdapi_config_hash="ccc13942b8756edc6055bb06bee51a46" id="022b8913-ae9f-4559-abcd-583e586170d0" chipset="icl" name="ComputeL3Cache" />
+    <guid config_hash="34c5bc89788487e6d32ea9894929b1ae" mdapi_config_hash="0b8dc07dcfe3a03bf65771ee8404fa10" id="03c7a167-2abc-4ba6-878a-f1d80082abca" chipset="icl" name="RenderPipeProfile" />
+    <guid config_hash="dfb00108bfdc1c652f9550bf5ec9262f" mdapi_config_hash="9b4b61a06cf60de356d48995441e6724" id="c5cbc488-6569-41dd-9128-42bf6f0d317c" chipset="icl" name="HDCAndSF" />
+    <guid config_hash="8818a97d48d99673e220075b0ba71eb3" mdapi_config_hash="d3e8cc994e923fc2f79f086273b62ece" id="0316ce4f-e03f-4738-8262-13528fce8eea" chipset="icl" name="RasterizerAndPixelBackend" />
+    <guid config_hash="e1436790af3b1bbea5a0262704c213b1" mdapi_config_hash="7b7377687e294a3c2ee88e0715a65f01" id="21d69ec3-91e1-48a8-acd6-c0c4ec6e819a" chipset="icl" name="L3_1" />
+    <guid config_hash="5ef586cc746e34ab542586805cb26c8e" mdapi_config_hash="06190180046d22f3155558f2211abc30" id="e60e9155-6830-4aec-baf2-1c3c15a73869" chipset="icl" name="L3_2" />
+    <guid config_hash="abdae7b3820fd860c6fec7a98f9654bf" mdapi_config_hash="5cf54f89d0c9ebeeebc46bfde154fdf2" id="47c364d5-1799-4d17-9447-add9358c6451" chipset="icl" name="L3_3" />
+    <guid config_hash="8b3ca983367a86a4dc4c80fe2a4cfbbb" mdapi_config_hash="397319e33a2d28c3602837be8737b559" id="e5ab5c08-3130-4469-8eaf-b23d3dc817d4" chipset="icl" name="L3_4" />
+    <guid config_hash="c5b76b0b898d48bd6305b7208f338584" mdapi_config_hash="9870c08d2dbb2de9836e8effdc5074a8" id="6cdf23c1-f725-414c-959a-c90fa5571b1f" chipset="icl" name="L3_5" />
+    <guid config_hash="667224b11f675b2ac565e18624fad738" mdapi_config_hash="e49091662060a5c502da58bd613abc7f" id="51a2eb6d-9fad-4489-8f22-ab845fe7882a" chipset="icl" name="Sampler_1" />
+    <guid config_hash="e6910b0739c288d68194e64933845380" mdapi_config_hash="d55ee03d24efe992a4029534908c2550" id="afc0f021-8c33-4d60-803d-93487f96c7c1" chipset="icl" name="Sampler_2" />
+    <guid config_hash="525a9fe5285599f695330c45ba2e8b62" mdapi_config_hash="6aa36798625267734b4d066d9090c0bd" id="eddc2f32-b196-4a72-9bf8-21770e35f8bd" chipset="icl" name="TDL_1" />
+    <guid config_hash="b141825840f912e9d7c98a13ae34d600" mdapi_config_hash="af8ee9d86606564460ce2928023e47a5" id="c6d3af7b-037b-4656-95e1-4f838f0a2c14" chipset="icl" name="TDL_2" />
+    <guid config_hash="d2188fa3c865ef430532b127a3fd87a5" mdapi_config_hash="ff33e47c767f6f81d9a779153aae6fdb" id="fd25ec19-3ed1-40c9-8648-1d2387449a92" chipset="icl" name="TDL_3" />
+    <guid config_hash="b421b29d8557dbbf0fe3068c82b3d8dd" mdapi_config_hash="cc850ab4463c23e6017f069d67785c31" id="40dc79f2-88c8-47c6-8f86-f509e39fbe5d" chipset="icl" name="GpuBusyness" />
+    <guid config_hash="7480125fc0806a347f975dc714568e92" mdapi_config_hash="c6b1c7a22e3c2f456cbfdae1bfe394ac" id="3c0bf614-5d67-4326-887f-a24eb8a58244" chipset="icl" name="TestOa" />
+</guids>
diff --git a/lib/i915/perf-configs/mdapi-xml-convert.py b/lib/i915/perf-configs/mdapi-xml-convert.py
new file mode 100755
index 00000000..43cb1bf1
--- /dev/null
+++ b/lib/i915/perf-configs/mdapi-xml-convert.py
@@ -0,0 +1,1000 @@
+#!/usr/bin/env python2
+
+# Copyright (C) 2015-2016 Intel Corporation
+#
+# Permission is hereby granted, free of charge, to any person obtaining a copy
+# of this software and associated documentation files (the "Software"), to deal
+# in the Software without restriction, including without limitation the rights
+# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+# copies of the Software, and to permit persons to whom the Software is
+# furnished to do so, subject to the following conditions:
+#
+# The above copyright notice and this permission notice shall be included in
+# all copies or substantial portions of the Software.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+# SOFTWARE.
+
+
+# "MDAPI" xml files are an XML schema for maintaining meta data about Gen
+# graphics Ovservability counters, where MD API is the name of a library shared
+# by Intel GPA and Intel VTune.
+#
+# These files aren't publicly documented and have some historical baggage that
+# adds some complexity as well as being inconsistent in a number of ways that
+# makes it quite a bit of effort to parse/use the data. We also don't have
+# guarantees about how this schema is maintained.
+#
+# We've taken the opportunity to find ways to simplify the input data and to
+# make it more consistent to hopefully reduce the effort involved in using the
+# data downstream.
+#
+
+
+import argparse
+import copy
+import hashlib
+from operator import itemgetter
+import re
+import sys
+import time
+import uuid
+
+import xml.etree.ElementTree as et
+import xml.sax.saxutils as saxutils
+
+import pylibs.oa_guid_registry as oa_registry
+
+
+# MDAPI configs include writes to some non-config registers,
+# thus the blacklists...
+
+gen8_11_chipset_params = {
+    'a_offset': 16,
+    'b_offset': 192,
+    'c_offset': 224,
+    'oa_report_size': 256,
+    'config_reg_blacklist': {
+        0x2364, # OACTXID
+    },
+}
+
+chipsets = {
+    'HSW': {
+        'a_offset': 12,
+        'b_offset': 192,
+        'c_offset': 224,
+        'oa_report_size': 256,
+        'registers': {
+            # TODO extend the symbol table for nicer output...
+                0x2710: { 'name': 'OASTARTTRIG1' },
+            0x2714: { 'name': 'OASTARTTRIG1' },
+            0x2718: { 'name': 'OASTARTTRIG1' },
+            0x271c: { 'name': 'OASTARTTRIG1' },
+            0x2720: { 'name': 'OASTARTTRIG1' },
+            0x2724: { 'name': 'OASTARTTRIG6' },
+            0x2728: { 'name': 'OASTARTTRIG7' },
+            0x272c: { 'name': 'OASTARTTRIG8' },
+            0x2740: { 'name': 'OAREPORTTRIG1' },
+            0x2744: { 'name': 'OAREPORTTRIG2' },
+            0x2748: { 'name': 'OAREPORTTRIG3' },
+            0x274c: { 'name': 'OAREPORTTRIG4' },
+            0x2750: { 'name': 'OAREPORTTRIG5' },
+            0x2754: { 'name': 'OAREPORTTRIG6' },
+            0x2758: { 'name': 'OAREPORTTRIG7' },
+            0x275c: { 'name': 'OAREPORTTRIG8' },
+            0x2770: { 'name': 'OACEC0_0' },
+            0x2774: { 'name': 'OACEC0_1' },
+            0x2778: { 'name': 'OACEC1_0' },
+            0x277c: { 'name': 'OACEC1_1' },
+            0x2780: { 'name': 'OACEC2_0' },
+            0x2784: { 'name': 'OACEC2_1' },
+            0x2788: { 'name': 'OACEC3_0' },
+            0x278c: { 'name': 'OACEC3_1' },
+            0x2790: { 'name': 'OACEC4_0' },
+            0x2794: { 'name': 'OACEC4_1' },
+            0x2798: { 'name': 'OACEC5_0' },
+            0x279c: { 'name': 'OACEC5_1' },
+            0x27a0: { 'name': 'OACEC6_0' },
+            0x27a4: { 'name': 'OACEC6_1' },
+            0x27a8: { 'name': 'OACEC7_0' },
+            0x27ac: { 'name': 'OACEC7_1' },
+        },
+        'config_reg_blacklist': {
+            0x2364, # OASTATUS1 register
+        },
+    },
+    'BDW': gen8_11_chipset_params,
+    'CHV': gen8_11_chipset_params,
+    'SKLGT2': gen8_11_chipset_params,
+    'SKLGT3': gen8_11_chipset_params,
+    'SKLGT4': gen8_11_chipset_params,
+    'BXT': gen8_11_chipset_params,
+    'KBLGT2': gen8_11_chipset_params,
+    'KBLGT3': gen8_11_chipset_params,
+    'GLK': gen8_11_chipset_params,
+    'CFLGT2': gen8_11_chipset_params,
+    'CFLGT3': gen8_11_chipset_params,
+    'CNL': gen8_11_chipset_params,
+    'ICL': gen8_11_chipset_params,
+}
+
+register_types = { 'OA', 'NOA', 'FLEX', 'PM' }
+
+default_set_blacklist = { "RenderDX1x", # TODO: rename to something non 'DX'
+                                        # specific if this config is generally
+                                        # usefull
+                          "RenderBalance", # XXX: missing register config
+                        }
+
+counter_blacklist = {
+    "DramLlcThroughput", # TODO: The max equation of this counter
+                         # requires dram throughtput value. Need to
+                         # investiguate how to get this value.
+}
+
+sys_vars = { "EuCoresTotalCount",
+             "EuSlicesTotalCount",
+             "SamplersTotalCount",
+             "EuThreadsCount",
+             "GpuMinFrequencyMHz",
+             "GpuMaxFrequencyMHz",
+             "GpuTimestampFrequency",
+             "SliceMask",
+             "SubsliceMask",
+             "EuSubslicesTotalCount"
+           }
+
+def underscore(name):
+    s = re.sub('MHz', 'Mhz', name)
+    s = re.sub('\.', '_', s)
+    s = re.sub('(.)([A-Z][a-z]+)', r'\1_\2', s)
+    return re.sub('([a-z0-9])([A-Z])', r'\1_\2', s).lower()
+
+def print_err(*args):
+    sys.stderr.write(' '.join(map(str,args)) + '\n')
+
+read_register_offsets = {
+    0x1f0: 'PERFCNT1',
+    0x1f8: 'PERFCNT2',
+}
+
+def read_value(chipset, offset):
+    if offset in read_register_offsets:
+        return read_register_offsets[offset]
+    print_err("Unknown offset register at offset {0}".format(offset))
+    assert 0
+
+
+def read_token_to_rpn_read(chipset, token, raw_offsets):
+    width, offset_str = token.split('@')
+
+    # For Broadwell the raw read notation was extended for 40 bit
+    # counters: rd40@<32bit_part1_offset>:<8bit_part2_offset>
+    if width == "rd40":
+        offset_32_str, offset_8_str = offset_str.split(':')
+        offset_str = offset_32_str
+
+    offset = int(offset_str, 16)
+
+    if raw_offsets:
+        a_offset = chipsets[chipset]['a_offset']
+        b_offset = chipsets[chipset]['b_offset']
+        c_offset = chipsets[chipset]['c_offset']
+        report_size = chipsets[chipset]['oa_report_size']
+
+        if offset < a_offset:
+            if offset == 4:
+                return "GPU_TIME 0 READ"
+            elif offset == 12:
+                assert chipset != "HSW" # Only for Gen8+
+                return "GPU_CLOCK 0 READ"
+            else:
+                assert 0
+        elif offset < b_offset:
+            return "A " + str((offset - a_offset) / 4) + " READ"
+        elif offset < c_offset:
+            return "B " + str((offset - b_offset) / 4) + " READ"
+        elif offset < report_size:
+            return "C " + str((offset - c_offset) / 4) + " READ"
+        else:
+            return "{0} READ_REG".format(read_value(chipset, offset))
+    else:
+        idx = offset / 8
+        if chipset == "HSW":
+            # On Haswell accumulated counters are assumed to start
+            # with GPU_TIME followed by 45 A counters, then 8 B
+            # counters and finally 8 C counters.
+            if idx < 1:
+                return "GPU_TIME 0 READ"
+            elif idx < 46:
+                return "A " + str(idx - 1) + " READ"
+            elif idx < 54:
+                return "B " + str(idx - 46) + " READ"
+            elif idx < 62:
+                return "C " + str(idx - 54) + " READ"
+            else:
+                return "{0} READ_REG".format(read_value(chipset, offset))
+        else:
+            # For Gen8+ the array of accumulated counters is
+            # assumed to start with a GPU_TIME then GPU_CLOCK,
+            # then 36 A counters, then 8 B counters and finally
+            # 8 C counters.
+            if idx == 0:
+                return "GPU_TIME 0 READ"
+            elif idx == 1:
+                return "GPU_CLOCK 0 READ"
+            elif idx < 38:
+                return "A " + str(idx - 2) + " READ"
+            elif idx < 46:
+                return "B " + str(idx - 38) + " READ"
+            elif idx < 54:
+                return "C " + str(idx - 46) + " READ"
+            else:
+                return "{0} READ_REG".format(read_value(chipset, offset))
+
+    assert 0
+
+def replace_read_tokens_with_rpn_read_ops(chipset, equation, raw_offsets):
+    # MDAPI MetricSet equations use tokens like 'dw at 0xff' for reading raw
+    # values from snapshots, but this doesn't seem convenient for a few
+    # reasons:
+    #
+    # 1) The offsets hide the particular a, b, or c counter they
+    #    correspond to which in turn makes it awkward to experiment
+    #    with different report sizes which trade off how many a, b and
+    #    c counters are available
+    #
+    # 2) Raw reads could be represented as RPN operations too, and
+    #    the consistency could make them slightly easier for tools to
+    #    handle, E.g:
+    #
+    #      "A 5 READ" = read A counter 5
+    #
+    # We replace dw@ address tokens with GPU_TIME, A, B or C READ ops...
+    #
+
+    tokens = equation.split()
+    equation = ""
+
+    for token in tokens:
+        if '@' in token:
+            read_exp = read_token_to_rpn_read(chipset, token, raw_offsets)
+            equation = equation + " " + read_exp
+        else:
+            equation = equation + " " + token
+
+    return equation
+
+
+parser = argparse.ArgumentParser()
+parser.add_argument("xml", nargs="+", help="XML description of metrics")
+parser.add_argument("--guids", required=True, help="Metric set GUID registry")
+parser.add_argument("--whitelist", help="Only output for given, space-separated, sets")
+parser.add_argument("--blacklist", help="Don't generate anything for given metric sets")
+parser.add_argument("--merge", help="Additional meta data to merge into the result")
+parser.add_argument("--dry-run", action="store_true",
+                    help="Not generate new XML but to check any errors")
+
+args = parser.parse_args()
+
+metrics = et.Element('metrics')
+tree = et.ElementTree(metrics)
+
+def apply_aliases(text, aliases):
+    if aliases == None:
+        return text
+
+    for alias in aliases.split(','):
+        (a, b) = alias.split('|')
+        text = re.sub(r"\b%s\b" % re.escape(a), b, text)
+
+        a = a.lower()
+        b = b.lower()
+        text = re.sub(r"\b%s\b" % re.escape(a), b, text)
+
+    return text
+
+def strip_dx_apis(text):
+    if text == None:
+        return ""
+    stripped = ""
+    apis = text.split()
+    for api in apis:
+        if api[:2] != "DX":
+            stripped = stripped + " " + api
+
+    return stripped.strip()
+
+# For recursively appending counters in order of dependencies...
+def append_deps_and_counter(mdapi_counter, mdapi_counters, deps,
+                            sorted_array, sorted_set):
+    symbol_name = mdapi_counter.get('SymbolName')
+
+    if symbol_name in sorted_set:
+        return
+
+    for dep_name in deps[symbol_name]:
+        if dep_name in mdapi_counters:
+            append_deps_and_counter(mdapi_counters[dep_name], mdapi_counters, deps,
+                                    sorted_array, sorted_set)
+
+    sorted_array.append(mdapi_counter)
+    sorted_set[symbol_name] = mdapi_counter
+
+def sort_counters(mdapi_counters, deps):
+    sorted_array = []
+    sorted_set = {} # counters in here have been added to array
+    for symbol_name in mdapi_counters:
+        append_deps_and_counter(mdapi_counters[symbol_name], mdapi_counters, deps,
+                                sorted_array, sorted_set)
+
+    return sorted_array
+
+def expand_macros(equation):
+    equation = equation.replace('GpuDuration', "$Self 100 UMUL $GpuCoreClocks FDIV")
+    equation = equation.replace('EuAggrDuration', "$Self $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV")
+    return equation
+
+def fixup_equation(equation):
+    if equation is None:
+        return None
+    return equation.replace('$SubliceMask', '$SubsliceMask')
+
+# The MDAPI XML files sometimes duplicate the same Flex EU/OA regs
+# between configs with different AvailabilityEquations even though the
+# availability checks are only expected to affect the MUX configs
+#
+# We iterate all the configs to filter out the FLEX/OA configs and
+# double check that there's never any variations between repeated
+# configs
+#
+def filter_single_config_registers_of_type(mdapi_metric_set, type):
+    regs = []
+    for mdapi_reg_config in mdapi_metric_set.findall("RegConfigStart"):
+        tmp_regs = []
+        for mdapi_reg in mdapi_reg_config.findall("Register"):
+            reg = (int(mdapi_reg.get('offset'),16), int(mdapi_reg.get('value'),16))
+
+            if reg[0] in chipsets[chipset]['config_reg_blacklist']:
+                continue
+
+            if mdapi_reg.get('type') == type:
+                tmp_regs.append(reg)
+
+        if len(tmp_regs) > 0:
+            bad = False
+            if len(regs) == 0:
+                regs = tmp_regs
+            elif len(regs) != len(tmp_regs):
+                bad = True
+            else:
+                for i in xrange(0, len(regs)):
+                    if regs[i] != tmp_regs[i]:
+                        bad = True
+                        break
+            if bad:
+                print_err("ERROR: multiple, differing FLEX/OA configs for one set: MetricSet=\"" + mdapi_metric_set.get('ShortName'))
+                sys.exit(1)
+
+    return regs
+
+
+# We only have a very small number of IDs, but we aren't assuming they
+# start from zero or are contiguous in the MDAPI XML files. Python
+# doesn't seem to have a built in sparse array type so we just
+# loop over the entries we have:
+def get_mux_id_group(id_groups, id):
+    for group in id_groups:
+        if group['id'] == id:
+            return group
+
+    new_group = { 'id': id, 'configs': [] }
+    id_groups.append(new_group)
+
+    return new_group
+
+
+
+def process_mux_configs(mdapi_set):
+    allow_missing_id = True
+
+    mux_config_id_groups = []
+
+    for mdapi_reg_config in mdapi_set.findall("RegConfigStart"):
+
+        mux_regs = []
+        for mdapi_reg in mdapi_reg_config.findall("Register"):
+            address = int(mdapi_reg.get('offset'), 16)
+
+            if address in chipsets[chipset]['config_reg_blacklist']:
+                continue
+
+            reg_type = mdapi_reg.get('type')
+
+            if reg_type not in register_types:
+                print_err("ERROR: unknown register type=\"" + reg_type + "\": MetricSet=\"" + mdapi_set.get('ShortName'))
+                sys.exit(1)
+
+            if reg_type != 'NOA' and reg_type != 'PM':
+                continue
+
+            reg = (address, int(mdapi_reg.get('value'), 16))
+            mux_regs.append(reg)
+
+        if len(mux_regs) == 0:
+            continue
+
+        availability = mdapi_reg_config.get('AvailabilityEquation')
+        if availability == "":
+            availability = None
+
+        if mdapi_reg_config.get('ConfigPriority') != None:
+            reg_config_priority = int(mdapi_reg_config.get('ConfigPriority'))
+        else:
+            reg_config_priority = 0
+
+        if mdapi_reg_config.get('ConfigId') != None:
+            reg_config_id = int(mdapi_reg_config.get('ConfigId'))
+            allow_missing_id = False
+        elif mdapi_reg_config.get('ConfigId') == None and allow_missing_id == True:
+            reg_config_id = 0
+        else:
+            # It will spell trouble if there's a mixture of explicit and
+            # implied config IDs...
+            print_err("ERROR: register configs mixing implied/explicit IDs: MetricSet=\"" + mdapi_set.get('ShortName'))
+            sys.exit(1)
+
+        mux_config = { 'priority': reg_config_priority,
+                       'availability': availability,
+                       'registers': mux_regs }
+
+        mux_config_id_group = get_mux_id_group(mux_config_id_groups, reg_config_id)
+        mux_config_id_group['configs'].append(mux_config)
+
+    mux_config_id_groups.sort(key=itemgetter('id'))
+
+    # The only special case we currently support for more than one group of NOA
+    # MUX configs is for the Broadwell ComputeExtended metric set with two Id
+    # groups and the second just has a single unconditional config that can
+    # logically be appended to all the conditional configs of the first group
+    if len(mux_config_id_groups) > 1:
+        if len(mux_config_id_groups) != 2:
+            print_err("ERROR: Script doesn't currently allow more than two groups of NOA MUX configs for a single metric set: MetricSet=\"" + mdapi_set.get('ShortName'))
+            sys.exit(1)
+
+        last_id_group = mux_config_id_groups[-1]
+        if len(last_id_group['configs']) != 1:
+            print_err("ERROR: Script currently only allows up to two Ids for NOA MUX configs if second Id only contains a single unconditional config: MetricSet=\"" + mdapi_set.get('ShortName'))
+            sys.exit(1)
+
+        tail_config = last_id_group['configs'][0]
+        for mux_config in mux_config_id_groups[0]['configs']:
+            mux_config['registers'] = mux_config['registers'] + tail_config['registers']
+
+        mux_config_id_groups = [mux_config_id_groups[0]]
+
+    if len(mux_config_id_groups) == 0 or mux_config_id_groups[0]['configs'] == 0:
+        print_err("ERROR: MUX register configs missing: MetricSet=\"" + mdapi_set.get('ShortName'))
+        sys.exit(1)
+
+    mux_configs = mux_config_id_groups[0]['configs']
+    assert isinstance(mux_configs, list)
+    assert len(mux_configs) >= 1
+    assert len(mux_configs[0]['registers']) > 1 # > 1 registers
+    return mux_configs
+
+
+def add_register_config(set, priority, availability, regs, type):
+    reg_config = et.SubElement(set, 'register_config')
+
+    reg_config.set('type', type)
+
+    if availability != None:
+        assert type == "NOA"
+        reg_config.set('priority', str(priority))
+        reg_config.set('availability', availability)
+
+    for reg in regs:
+        elem = et.SubElement(reg_config, 'register')
+        elem.set('type', type)
+        elem.set('address', "0x%08X" % reg[0])
+        elem.set('value', "0x%08X" % reg[1])
+
+def to_text(value):
+    if value == None:
+        return ""
+    return value
+
+# There are duplicated metric sets with the same symbol name so we
+# keep track of the sets we've read so we can skip duplicates...
+sets = {}
+
+guids = {}
+
+guids_xml = et.parse(args.guids)
+for guid in guids_xml.findall(".//guid"):
+    hashing_key = oa_registry.Registry.chipset_derive_hash(guid.get('chipset'),
+                                                           guid.get('mdapi_config_hash'))
+    guids[hashing_key] = guid.get('id')
+
+for arg in args.xml:
+    mdapi = et.parse(arg)
+
+    concurrent_group = mdapi.find(".//ConcurrentGroup")
+
+    for mdapi_set in mdapi.findall(".//MetricSet"):
+
+        apis = mdapi_set.get('SupportedAPI')
+        if "OGL" not in apis and "OCL" not in apis and "MEDIA" not in apis:
+            continue
+
+        set_symbol_name = mdapi_set.get('SymbolName')
+
+        if set_symbol_name in sets:
+            print_err("WARNING: duplicate set named \"" + set_symbol_name + "\" (SKIPPING)")
+            continue
+
+        chipset = mdapi_set.get('SupportedHW')
+        if concurrent_group.get('SupportedGT') != None:
+            chipset = chipset + concurrent_group.get('SupportedGT')
+        if chipset not in chipsets:
+            continue
+
+        if args.whitelist:
+            set_whitelist = args.whitelist.split()
+            if set_symbol_name not in set_whitelist:
+                continue
+
+        if args.blacklist:
+            set_blacklist = args.blacklist.split()
+        else:
+            set_blacklist = default_set_blacklist
+        if set_symbol_name in set_blacklist:
+            continue
+
+        assert mdapi_set.get('SnapshotReportSize') == "256"
+
+        set = et.SubElement(metrics, 'set')
+
+        set.set('chipset', chipset)
+
+        set.set('name', mdapi_set.get('ShortName'))
+        set.set('symbol_name', set_symbol_name)
+        set.set('underscore_name', underscore(mdapi_set.get('SymbolName')))
+        set.set('mdapi_supported_apis', strip_dx_apis(mdapi_set.get('SupportedAPI')))
+
+
+        # Look at the hardware register config before looking at the counters.
+        #
+        # The hardware configuration is used as a key to lookup up a GUID which
+        # is used by applications to lookup the corresponding counter
+        # normalization equations.
+        #
+        # We want to skip over any metric sets that don't yet have a registered
+        # GUID in guids.xml.
+
+        # There can be multiple NOA MUX configs, since they may have associated
+        # availability tests to match particular systems.
+        #
+        # Unlike the MDAPI XML files we only support tracking one group of
+        # mutually exclusive MUX configs, whereas the MDAPI XML files
+        # theoretically allow a single metric set to be associated with ordered
+        # groups of mutually exclusive configs. So far there is only one
+        # Broadwell, ComputeExtended metric set which uses this, but that
+        # particular case can be expressed in less general terms.
+        #
+        # Being a bit simpler here should make it easier for downstream tools
+        # to deal with. (At least we got the handling of the Broadwell
+        # ComputeExtended example wrong and it took several email exchanges and
+        # a conference call to confirm how to interpret this case)
+        mux_configs = process_mux_configs(mdapi_set)
+
+        # Unlike for MUX registers, we only expect one set of FLEX/OA
+        # registers per metric set (even though they are sometimes duplicated
+        # between configs in MDAPI XML files.
+        #
+        # This filter function, extracts the register of a certain type but
+        # also double checks that if they are repeated in separate configs that
+        # they don't vary. (Notably the current i915 perf Linux driver would
+        # need some adapting to support multiple OA/FLEX configs with different
+        # availability expressions)
+        #
+        flex_regs = filter_single_config_registers_of_type(mdapi_set, "FLEX")
+        oa_regs = filter_single_config_registers_of_type(mdapi_set, "OA")
+
+
+        # Note: we ignore Perfmon registers
+
+        for mux_config in mux_configs:
+            add_register_config(set, mux_config['priority'], mux_config['availability'], mux_config['registers'], "NOA")
+        if len(oa_regs) > 0:
+            add_register_config(set, 0, None, oa_regs, "OA")
+        if len(flex_regs) > 0:
+            add_register_config(set, 0, None, flex_regs, "FLEX")
+
+        mdapi_hw_config_hash = oa_registry.Registry.mdapi_hw_config_hash(mdapi_set)
+        guid_hash = oa_registry.Registry.chipset_derive_hash(chipset.lower(),
+                                                             mdapi_hw_config_hash)
+        hw_config_hash = oa_registry.Registry.hw_config_hash(set)
+
+        if guid_hash in guids:
+            set.set('hw_config_guid', guids[guid_hash])
+        else:
+            print_err("WARNING: No GUID found for metric set " + chipset + ", " + set_symbol_name + " (SKIPPING)")
+            print_err("WARNING: If this is a new config add the following to guids.xml:")
+            print_err("<guid config_hash=\"" + hw_config_hash + "\" mdapi_config_hash=\"" + mdapi_hw_config_hash + "\" id=\"" + str(uuid.uuid4()) + "\" chipset=\"" + chipset.lower() + "\" name=\"" + set_symbol_name + "\" />")
+            metrics.remove(set)
+            continue
+
+
+        sets[set_symbol_name] = set
+
+        counters = {}
+        normalization_equations = {}
+        raw_equations = {}
+
+        # Awkwardly we can't assume metrics are in dependency order and have to
+        # sort them manually. We start by associating a list of dependencies with
+        # each counter...
+
+        mdapi_counters = {}
+        mdapi_counter_deps = {}
+
+        for mdapi_counter in mdapi_set.findall("Metrics/Metric"):
+            symbol_name = mdapi_counter.get('SymbolName')
+
+            if symbol_name in counter_blacklist:
+                continue;
+
+            # Have seen at least one MetricSet with a duplicate GpuCoreClocks counter...
+            if symbol_name in mdapi_counters:
+                print_err("WARNING: Skipping duplicate counter \"" + symbol_name + \
+                        "\" in " + set.get('name') + " :: " + mdapi_counter.get('ShortName'))
+                continue;
+
+            deps = []
+            equations = fixup_equation(str(mdapi_counter.get('SnapshotReportReadEquation'))) + " " + \
+                        fixup_equation(str(mdapi_counter.get('SnapshotReportDeltaEquation'))) + " " + \
+                        fixup_equation(str(mdapi_counter.get('DeltaReportReadEquation'))) + " " + \
+                        fixup_equation(str(mdapi_counter.get('NormalizationEquation')))
+            equations = expand_macros(equations)
+            equations = equations.replace('$$', "$")
+            for token in equations.split():
+                if token[0] == '$' and token[1:] not in sys_vars and token[1:] != "Self":
+                    deps.append(token[1:])
+
+            mdapi_counters[symbol_name] = mdapi_counter
+            mdapi_counter_deps[symbol_name] = deps
+
+        sorted_mdapi_counters = sort_counters(mdapi_counters, mdapi_counter_deps)
+
+        for mdapi_counter in sorted_mdapi_counters:
+
+            aliases = mdapi_counter.get('Alias')
+
+            skip_counter = False
+
+            # We don't currently support configuring and reading perfmon registers
+            signal = mdapi_counter.get('SignalName')
+            if signal and "perfmon" in signal:
+                continue;
+
+            # A few things to fixup with this common counter...
+            if mdapi_counter.get('SymbolName') == "AvgGpuCoreFrequencyMHz":
+                # To avoid requiring a special case in tools, add a max value
+                # equation for the gpu frequency...
+                mdapi_counter.set('MaxValueEquation', "$GpuMaxFrequency")
+
+                # Don't include units in the name
+                mdapi_counter.set('SymbolName', "AvgGpuCoreFrequency")
+
+                # Use canonical, first order of magnitude units specifier
+                mdapi_counter.set('MetricUnits', 'Hz')
+                mdapi_counter.set('NormalizationEquation', '$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV')
+                #mdapi_counter.set('DeltaReportReadEquation', '$GpuCoreClocks $GpuTime UDIV')
+
+
+            symbol_name = mdapi_counter.get('SymbolName')
+
+            counter = et.SubElement(set, 'counter')
+            counter.set('name', apply_aliases(mdapi_counter.get('ShortName'), aliases))
+            counter.set('symbol_name', mdapi_counter.get('SymbolName'))
+            counter.set('underscore_name', underscore(mdapi_counter.get('SymbolName')))
+            counter.set('description', apply_aliases(mdapi_counter.get('LongName'), aliases))
+            counter.set('mdapi_group', apply_aliases(to_text(mdapi_counter.get('Group')), aliases))
+            counter.set('mdapi_usage_flags', to_text(mdapi_counter.get('UsageFlags')))
+            counter.set('mdapi_supported_apis', strip_dx_apis(mdapi_counter.get('SupportedAPI')))
+            low = mdapi_counter.get('LowWatermark')
+            if low:
+                counter.set('low_watermark', low)
+            high = to_text(mdapi_counter.get('HighWatermark'))
+            if high:
+                counter.set('high_watermark', high)
+            counter.set('data_type', mdapi_counter.get('ResultType').lower())
+
+            max_eq = fixup_equation(mdapi_counter.get('MaxValueEquation'))
+            if max_eq:
+                counter.set('max_equation', max_eq)
+
+            # XXX Not sure why EU metrics tend to just be bundled under 'gpu'
+            counter.set('mdapi_hw_unit_type', mdapi_counter.get('HWUnitType').lower())
+
+            # There are counters representing cycle counts that have a semantic
+            # type of 'duration' which doesn't seem to make sense...
+            units = mdapi_counter.get('MetricUnits').lower()
+            if units == "cycles":
+                semantic_type = "event"
+            else:
+                semantic_type = mdapi_counter.get('MetricType').lower()
+
+            counter.set('units', units)
+            counter.set('semantic_type', semantic_type)
+
+            # MDAPI MetricSets have 3 different kinds of counter read equations:
+            #
+            # 1) One for reading a raw (unnormalized) value from a hardware report
+            #
+            #       The line between normalized and raw isn't always clear
+            #       as the raw equation may e.g. read and ADD multiple counters
+            #
+            #       Not all counters have a raw equation if they are instead
+            #       derived through $CounterName references to other counters
+            #       in a normalized value equation
+            #
+            # 2) One for reading an unnormalized value from the accumulated 'delta reports'
+            #
+            #       Seems to duplicate the raw equation but with delta report
+            #       offsets and referencing 64bit values
+            #
+            #       The normalized value equations are always based on these
+            #       accumulated delta values
+            #
+            # 3) One for reading a normalized value
+            #
+            #       These may start with a reference to "$Self" which is
+            #       effectively a macro for the above delta report equation
+            #
+            #       If this is missing the delta report equation is effectively
+            #       the normalized equation too
+            #
+            #       XXX: Beware that there are some inconsistent counters that
+            #       have a normalization equation with a $Self reference and a
+            #       raw equation but no delta report equation. This seems
+            #       pretty sketchy, but (at least for 'MEDIA' metrics) we will
+            #       substitute the raw equation for $Self in this case along
+            #       with a warning to double check the results.
+            #
+            # Currently there doesn't appear to be a clear reason to
+            # differentiate these equations and the separation seems to
+            # complicate things for tools wanting to generate code from this
+            # data.
+            #
+            # We instead aim to have one normalized equation per counter that
+            # always reference accumulated counter values.
+
+            # XXX: As a special case, we override the raw and delta report
+            # equations for the GpuTime counters, which seem inconsistent
+            if mdapi_counter.get('SymbolName') == "GpuTime":
+                mdapi_counter.set('SnapshotReportReadEquation', "dw at 0x04 1000000000 UMUL $GpuTimestampFrequency UDIV")
+                mdapi_counter.set('DeltaReportReadEquation', "qw at 0x0 1000000000 UMUL $GpuTimestampFrequency UDIV")
+
+            availability = fixup_equation(mdapi_counter.get('AvailabilityEquation'))
+            if availability == "":
+                availability = None
+
+            # We prefer to only look at the equations that reference the raw
+            # reports since the mapping of offsets back to A,B,C counters is
+            # unambiguous, but if necessary we will fallback to mapping
+            # delta report offsets (accumulated 64bit values that correspond
+            # to the 32bit or 40bit values from raw repots)
+
+            raw_read_eq = fixup_equation(mdapi_counter.get('SnapshotReportReadEquation'))
+            if raw_read_eq:
+                if raw_read_eq == "":
+                    raw_read_eq = None
+                else:
+                    raw_read_eq = replace_read_tokens_with_rpn_read_ops(chipset,
+                                                                        raw_read_eq,
+                                                                        True) #raw offsets
+
+            delta_read_eq = fixup_equation(mdapi_counter.get('DeltaReportReadEquation'))
+            if delta_read_eq:
+                if delta_read_eq == "":
+                    delta_read_eq = None
+                else:
+                    delta_read_eq = replace_read_tokens_with_rpn_read_ops(chipset,
+                                                                          delta_read_eq,
+                                                                          False) #delta offsets
+
+            if raw_read_eq and not delta_read_eq:
+                print_err("WARNING: Counter with raw equation but no delta report equation: MetricSet=\"" + \
+                          mdapi_set.get('ShortName') + "\" Metric=\"" + mdapi_counter.get('SymbolName') + \
+                          "(" + mdapi_counter.get('ShortName') + ")" + "\"")
+                # Media metric counters currently have no delta equation even
+                # though they have normalization equations that reference $Self
+                if "MEDIA" in apis:
+                    print_err("WARNING: -> Treating inconsistent media metric's 'raw' equation as a 'delta report' equation, but results should be double checked!")
+                    delta_read_eq = raw_read_eq
+                else:
+                    set.remove(counter)
+                    continue
+
+            # Some counters are sourced from register values that are
+            # not put into the OA reports. This is why some counters
+            # will have a delta equation but not a raw equation. These
+            # counters are typically only available in query mode. For
+            # this reason we put a particular availability value.
+            if delta_read_eq and not raw_read_eq:
+                assert availability == None
+                availability = "true $QueryMode &&"
+                raw_read_eq = delta_read_eq
+
+            # After replacing read tokens with RPN counter READ ops the raw and
+            # delta equations are expected to be identical so warn if that's
+            # not true...
+            if bool(raw_read_eq) ^ bool(delta_read_eq) or raw_read_eq != delta_read_eq:
+                print_err("WARNING: Inconsistent raw and delta report equations for " + \
+                          mdapi_set.get('ShortName') + " :: " + mdapi_counter.get('SymbolName') + \
+                          "(" + mdapi_counter.get('ShortName') + ")" + ": raw=\"" + str(raw_read_eq) + \
+                          "\" delta=\"" + str(delta_read_eq) + "\" (SKIPPING)")
+                set.remove(counter)
+                continue
+
+            normalize_eq = fixup_equation(mdapi_counter.get('NormalizationEquation'))
+            if normalize_eq and normalize_eq == "":
+                normalize_eq = None
+
+            if normalize_eq:
+                # Some normalization equations are represented with macros such as
+                # 'GpuDuration' corresponding to:
+                #
+                #   "$Self 100 UMUL $GpuCoreClocks FDIV"
+                #
+                # We expand macros here so tools don't need to care about them...
+                #
+                equation = normalize_eq
+                equation = expand_macros(equation)
+                if raw_read_eq:
+                    equation = equation.replace('$Self', raw_read_eq)
+            else:
+                equation = delta_read_eq
+
+            if '$Self' in equation:
+                print_err("WARNING: Counter equation (\"" + equation + "\") with unexpanded $Self token: MetricSet=\"" + \
+                          mdapi_set.get('ShortName') + "\" Metric=\"" + mdapi_counter.get('SymbolName') + \
+                          "(" + mdapi_counter.get('ShortName') + ")" + "\" (SKIPPING)")
+                set.remove(counter)
+                continue
+
+            # $$CounterName vs $CounterName in an equation is intended to
+            # differentiate referencing the normalized or raw value of another
+            # counter.
+            #
+            # Since we are only keeping a single (normalized) equation for
+            # counters we only need one form, but we want to be careful to
+            # check if any equations really depend on the raw value of another
+            # counter so we can expand those variables now
+            #
+            tmp = equation
+            for token in tmp.split():
+                if token[0] == '$' and token[1] != '$':
+                    if token[1:] in normalization_equations:
+                        raw_eq = raw_equations[token[1:]]
+
+                        equation = equation.replace(token, raw_eq)
+                        #if token[1:] not in raw_equations:
+                        #   print_err("WARNING: Counter equation (\"" + equation + "\") references un-kept raw equation of another counter : MetricSet=\"" + \
+                        #             mdapi_set.get('ShortName') + "\" Metric=\"" + mdapi_counter.get('ShortName') + "\"")
+
+                    elif token[1:] not in raw_equations and token[1:] not in sys_vars:
+                        print_err("Unknown variable name: \"" + token + "\" in equation \"" + equation + "\"")
+
+            symbol_name = counter.get('symbol_name')
+
+            # Make sure that every variable in the equation is a known sys_var or counter name
+            equation = equation.replace('$$', "$")
+            for token in equation.split():
+                if token[0] == '$':
+                    if token[1:] not in counters and token[1:] not in sys_vars:
+                        print_err("WARNING: Counter equation (\"" + equation + "\") with unknown variable " + \
+                                  token + " (maybe skipped counter): MetricSet=\"" + mdapi_set.get('ShortName') + \
+                                  "\" Metric=\"" + mdapi_counter.get('SymbolName') + "(" + mdapi_counter.get('ShortName') + \
+                                  ")" + "\" (SKIPPING)")
+                        set.remove(counter)
+                        skip_counter = True
+                        break
+
+            if skip_counter:
+                continue
+
+            counter.set('equation', equation.strip())
+
+            if availability != None:
+                counter.set('availability', availability)
+
+            counters[symbol_name] = counter;
+            if normalize_eq:
+                normalization_equations[symbol_name] = normalize_eq
+            if raw_read_eq:
+                raw_equations[symbol_name] = raw_read_eq
+
+
+if args.dry_run:
+    sys.exit(0)
+
+# Merge in any custom meta data we have...
+if args.merge:
+    merge = et.parse(args.merge)
+    merge_metrics = merge.getroot()
+
+    for merge_set in merge.findall(".//set"):
+        pattern = ".//set[@symbol_name=\"" + merge_set.get('symbol_name') + "\"][@chipset=\"" + merge_set.get('chipset') + "\"]"
+        real_set = metrics.find(pattern)
+        if real_set is not None:
+            for set_attr in merge_set.items():
+                real_set.set(set_attr[0], set_attr[1])
+
+            for merge_elem in merge_set:
+                if merge_elem.tag == "counter":
+                    merge_counter = merge_elem
+                    pattern = "counter[@symbol_name=\"" + merge_counter.get('symbol_name') + "\"]"
+                    real_counter = real_set.find(pattern)
+                    if real_counter is not None:
+                        for counter_attr in merge_counter.items():
+                            real_counter.set(counter_attr[0], counter_attr[1])
+                    else:
+                        real_set.append(merge_counter)
+                        real_counter = merge_counter
+                else:
+                    real_set.append(merge_elem)
+
+    # For consistency + readability print everything manually...
+    merge_md5 = hashlib.md5(open("merge.xml", 'rb').read()).hexdigest()
+else:
+    merge_md5 = ""
+
+print ("<?xml version=\"1.0\"?>")
+print("<metrics version=\"" + str(int(time.time())) + "\" merge_md5=\"" + merge_md5 + "\">")
+for set in metrics.findall(".//set"):
+    print("  <set name=\"" + set.get('name') + "\"")
+    del set.attrib['name']
+    for attr in set.items():
+        print("       " + attr[0] + "=\"" + attr[1] + "\"")
+    print("       >")
+    for counter in set.findall("counter"):
+        print("    <counter name=\"" + counter.get('name') + "\"")
+        del counter.attrib['name']
+        for attr in counter.items():
+            if attr[0][:6] != "mdapi_":
+                print("             " + attr[0] + "=\"" + saxutils.escape(attr[1]) + "\"")
+        for attr in counter.items():
+            if attr[0][:6] == "mdapi_":
+                print("             " + attr[0] + "=\"" + saxutils.escape(attr[1]) + "\"")
+        print("             />")
+    for config in set.findall("register_config"):
+        if config.get('availability') != None:
+            print("    <register_config type=\"" + config.get('type') + "\"")
+            print("                     availability=\"" + saxutils.escape(config.get('availability')) + "\"")
+            print("                     priority=\"" + config.get('priority') + "\"")
+            print("                     >")
+        else:
+            print("    <register_config type=\"" + config.get('type') + "\">")
+        for reg in config.findall("register"):
+            addr = int(reg.get('address'), 16)
+
+            if 'registers' in chipsets[chipset] and addr in chipsets[chipset]['registers']:
+                reg_info = chipsets[chipset]['registers'][addr]
+                comment = ' <!--' + reg_info['name'] + ' -->'
+            else:
+                comment = ''
+
+            print("        <register type=\"" + reg.get('type') + "\" address=\"" + reg.get('address') + "\" value=\"" + reg.get('value') + "\" />" + comment)
+        print("    </register_config>")
+    print("  </set>\n")
+print("</metrics>")
diff --git a/lib/i915/perf-configs/oa-bdw.xml b/lib/i915/perf-configs/oa-bdw.xml
new file mode 100644
index 00000000..360e3c84
--- /dev/null
+++ b/lib/i915/perf-configs/oa-bdw.xml
@@ -0,0 +1,15653 @@
+<?xml version="1.0"?>
+<metrics version="1562317147" merge_md5="">
+  <set name="Render Metrics Basic Gen8"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="b541bd57-0e0f-4154-b4c0-5858010a2bf7"
+       chipset="BDW"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ B 5 READ UADD 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA"
+                     availability="$SliceMask 0x01 AND"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x143F000F" />
+        <register type="NOA" address="0x00009888" value="0x14110014" />
+        <register type="NOA" address="0x00009888" value="0x14310014" />
+        <register type="NOA" address="0x00009888" value="0x14BF000F" />
+        <register type="NOA" address="0x00009888" value="0x118A0317" />
+        <register type="NOA" address="0x00009888" value="0x13837BE0" />
+        <register type="NOA" address="0x00009888" value="0x3B800060" />
+        <register type="NOA" address="0x00009888" value="0x3D800005" />
+        <register type="NOA" address="0x00009888" value="0x005C4000" />
+        <register type="NOA" address="0x00009888" value="0x065C8000" />
+        <register type="NOA" address="0x00009888" value="0x085CC000" />
+        <register type="NOA" address="0x00009888" value="0x003D8000" />
+        <register type="NOA" address="0x00009888" value="0x183D0800" />
+        <register type="NOA" address="0x00009888" value="0x0A3F0023" />
+        <register type="NOA" address="0x00009888" value="0x103F0000" />
+        <register type="NOA" address="0x00009888" value="0x00584000" />
+        <register type="NOA" address="0x00009888" value="0x08584000" />
+        <register type="NOA" address="0x00009888" value="0x0A5A4000" />
+        <register type="NOA" address="0x00009888" value="0x005B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B8000" />
+        <register type="NOA" address="0x00009888" value="0x185B2400" />
+        <register type="NOA" address="0x00009888" value="0x0A1D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C1F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAA00" />
+        <register type="NOA" address="0x00009888" value="0x00384000" />
+        <register type="NOA" address="0x00009888" value="0x0E384000" />
+        <register type="NOA" address="0x00009888" value="0x16384000" />
+        <register type="NOA" address="0x00009888" value="0x18380001" />
+        <register type="NOA" address="0x00009888" value="0x00392000" />
+        <register type="NOA" address="0x00009888" value="0x06398000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A391000" />
+        <register type="NOA" address="0x00009888" value="0x00104000" />
+        <register type="NOA" address="0x00009888" value="0x08104000" />
+        <register type="NOA" address="0x00009888" value="0x00110030" />
+        <register type="NOA" address="0x00009888" value="0x08110031" />
+        <register type="NOA" address="0x00009888" value="0x10110000" />
+        <register type="NOA" address="0x00009888" value="0x00134000" />
+        <register type="NOA" address="0x00009888" value="0x16130020" />
+        <register type="NOA" address="0x00009888" value="0x06308000" />
+        <register type="NOA" address="0x00009888" value="0x08308000" />
+        <register type="NOA" address="0x00009888" value="0x06311800" />
+        <register type="NOA" address="0x00009888" value="0x08311880" />
+        <register type="NOA" address="0x00009888" value="0x10310000" />
+        <register type="NOA" address="0x00009888" value="0x0E334000" />
+        <register type="NOA" address="0x00009888" value="0x16330080" />
+        <register type="NOA" address="0x00009888" value="0x0ABF1180" />
+        <register type="NOA" address="0x00009888" value="0x10BF0000" />
+        <register type="NOA" address="0x00009888" value="0x0ADA8000" />
+        <register type="NOA" address="0x00009888" value="0x0A9D8000" />
+        <register type="NOA" address="0x00009888" value="0x109F0002" />
+        <register type="NOA" address="0x00009888" value="0x0AB94000" />
+        <register type="NOA" address="0x00009888" value="0x0D888000" />
+        <register type="NOA" address="0x00009888" value="0x038A0380" />
+        <register type="NOA" address="0x00009888" value="0x058A000E" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A00A0" />
+        <register type="NOA" address="0x00009888" value="0x078A0000" />
+        <register type="NOA" address="0x00009888" value="0x098A0000" />
+        <register type="NOA" address="0x00009888" value="0x238B2820" />
+        <register type="NOA" address="0x00009888" value="0x258B2550" />
+        <register type="NOA" address="0x00009888" value="0x198C1000" />
+        <register type="NOA" address="0x00009888" value="0x0B8D8000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA0" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x0D831021" />
+        <register type="NOA" address="0x00009888" value="0x0F83572F" />
+        <register type="NOA" address="0x00009888" value="0x01835680" />
+        <register type="NOA" address="0x00009888" value="0x0383002C" />
+        <register type="NOA" address="0x00009888" value="0x11830000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830001" />
+        <register type="NOA" address="0x00009888" value="0x05830000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x05844000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C137" />
+        <register type="NOA" address="0x00009888" value="0x1D80C147" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x15804000" />
+        <register type="NOA" address="0x00009888" value="0x4D801110" />
+        <register type="NOA" address="0x00009888" value="0x4F800331" />
+        <register type="NOA" address="0x00009888" value="0x43800802" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45801465" />
+        <register type="NOA" address="0x00009888" value="0x53801111" />
+        <register type="NOA" address="0x00009888" value="0x478014A5" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800CA5" />
+        <register type="NOA" address="0x00009888" value="0x41800003" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SliceMask 0x02 AND"
+                     priority="1"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x143F000F" />
+        <register type="NOA" address="0x00009888" value="0x14BF000F" />
+        <register type="NOA" address="0x00009888" value="0x14910014" />
+        <register type="NOA" address="0x00009888" value="0x14B10014" />
+        <register type="NOA" address="0x00009888" value="0x118A0317" />
+        <register type="NOA" address="0x00009888" value="0x13837BE0" />
+        <register type="NOA" address="0x00009888" value="0x3B800060" />
+        <register type="NOA" address="0x00009888" value="0x3D800005" />
+        <register type="NOA" address="0x00009888" value="0x0A3F0023" />
+        <register type="NOA" address="0x00009888" value="0x103F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A5A4000" />
+        <register type="NOA" address="0x00009888" value="0x0A1D4000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F8000" />
+        <register type="NOA" address="0x00009888" value="0x0A391000" />
+        <register type="NOA" address="0x00009888" value="0x00DC4000" />
+        <register type="NOA" address="0x00009888" value="0x06DC8000" />
+        <register type="NOA" address="0x00009888" value="0x08DCC000" />
+        <register type="NOA" address="0x00009888" value="0x00BD8000" />
+        <register type="NOA" address="0x00009888" value="0x18BD0800" />
+        <register type="NOA" address="0x00009888" value="0x0ABF1180" />
+        <register type="NOA" address="0x00009888" value="0x10BF0000" />
+        <register type="NOA" address="0x00009888" value="0x00D84000" />
+        <register type="NOA" address="0x00009888" value="0x08D84000" />
+        <register type="NOA" address="0x00009888" value="0x0ADA8000" />
+        <register type="NOA" address="0x00009888" value="0x00DB4000" />
+        <register type="NOA" address="0x00009888" value="0x0EDB8000" />
+        <register type="NOA" address="0x00009888" value="0x18DB2400" />
+        <register type="NOA" address="0x00009888" value="0x0A9D8000" />
+        <register type="NOA" address="0x00009888" value="0x0C9F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E9F2A00" />
+        <register type="NOA" address="0x00009888" value="0x109F0002" />
+        <register type="NOA" address="0x00009888" value="0x00B84000" />
+        <register type="NOA" address="0x00009888" value="0x0EB84000" />
+        <register type="NOA" address="0x00009888" value="0x16B84000" />
+        <register type="NOA" address="0x00009888" value="0x18B80001" />
+        <register type="NOA" address="0x00009888" value="0x00B92000" />
+        <register type="NOA" address="0x00009888" value="0x06B98000" />
+        <register type="NOA" address="0x00009888" value="0x08B9A000" />
+        <register type="NOA" address="0x00009888" value="0x0AB94000" />
+        <register type="NOA" address="0x00009888" value="0x00904000" />
+        <register type="NOA" address="0x00009888" value="0x08904000" />
+        <register type="NOA" address="0x00009888" value="0x00910030" />
+        <register type="NOA" address="0x00009888" value="0x08910031" />
+        <register type="NOA" address="0x00009888" value="0x10910000" />
+        <register type="NOA" address="0x00009888" value="0x00934000" />
+        <register type="NOA" address="0x00009888" value="0x16930020" />
+        <register type="NOA" address="0x00009888" value="0x06B08000" />
+        <register type="NOA" address="0x00009888" value="0x08B08000" />
+        <register type="NOA" address="0x00009888" value="0x06B11800" />
+        <register type="NOA" address="0x00009888" value="0x08B11880" />
+        <register type="NOA" address="0x00009888" value="0x10B10000" />
+        <register type="NOA" address="0x00009888" value="0x0EB34000" />
+        <register type="NOA" address="0x00009888" value="0x16B30080" />
+        <register type="NOA" address="0x00009888" value="0x01888000" />
+        <register type="NOA" address="0x00009888" value="0x0D88B800" />
+        <register type="NOA" address="0x00009888" value="0x038A0380" />
+        <register type="NOA" address="0x00009888" value="0x058A000E" />
+        <register type="NOA" address="0x00009888" value="0x1B8A0080" />
+        <register type="NOA" address="0x00009888" value="0x078A0000" />
+        <register type="NOA" address="0x00009888" value="0x098A0000" />
+        <register type="NOA" address="0x00009888" value="0x238B2840" />
+        <register type="NOA" address="0x00009888" value="0x258B26A0" />
+        <register type="NOA" address="0x00009888" value="0x018C4000" />
+        <register type="NOA" address="0x00009888" value="0x0F8C4000" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C1100" />
+        <register type="NOA" address="0x00009888" value="0x018D2000" />
+        <register type="NOA" address="0x00009888" value="0x078D8000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8D8000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA0" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x0D831021" />
+        <register type="NOA" address="0x00009888" value="0x0F83572F" />
+        <register type="NOA" address="0x00009888" value="0x01835680" />
+        <register type="NOA" address="0x00009888" value="0x0383002C" />
+        <register type="NOA" address="0x00009888" value="0x11830000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830001" />
+        <register type="NOA" address="0x00009888" value="0x05830000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x05844000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C137" />
+        <register type="NOA" address="0x00009888" value="0x1D80C147" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x15804000" />
+        <register type="NOA" address="0x00009888" value="0x4D801550" />
+        <register type="NOA" address="0x00009888" value="0x4F800331" />
+        <register type="NOA" address="0x00009888" value="0x43800802" />
+        <register type="NOA" address="0x00009888" value="0x51800400" />
+        <register type="NOA" address="0x00009888" value="0x458004A1" />
+        <register type="NOA" address="0x00009888" value="0x53805555" />
+        <register type="NOA" address="0x00009888" value="0x47800421" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F801421" />
+        <register type="NOA" address="0x00009888" value="0x41800845" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen8"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="35fbc9b2-a891-40a6-a38d-022bb7057552"
+       chipset="BDW"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of typed memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL  $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA"
+                     availability="$SliceMask 0x01 AND"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x105C00E0" />
+        <register type="NOA" address="0x00009888" value="0x105800E0" />
+        <register type="NOA" address="0x00009888" value="0x103800E0" />
+        <register type="NOA" address="0x00009888" value="0x3580001A" />
+        <register type="NOA" address="0x00009888" value="0x3B800060" />
+        <register type="NOA" address="0x00009888" value="0x3D800005" />
+        <register type="NOA" address="0x00009888" value="0x065C2100" />
+        <register type="NOA" address="0x00009888" value="0x0A5C0041" />
+        <register type="NOA" address="0x00009888" value="0x0C5C6600" />
+        <register type="NOA" address="0x00009888" value="0x005C6580" />
+        <register type="NOA" address="0x00009888" value="0x085C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5C8000" />
+        <register type="NOA" address="0x00009888" value="0x00580042" />
+        <register type="NOA" address="0x00009888" value="0x08582080" />
+        <register type="NOA" address="0x00009888" value="0x0C58004C" />
+        <register type="NOA" address="0x00009888" value="0x0E582580" />
+        <register type="NOA" address="0x00009888" value="0x005B4000" />
+        <register type="NOA" address="0x00009888" value="0x185B1000" />
+        <register type="NOA" address="0x00009888" value="0x1A5B0104" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAA00" />
+        <register type="NOA" address="0x00009888" value="0x101F02AA" />
+        <register type="NOA" address="0x00009888" value="0x08380042" />
+        <register type="NOA" address="0x00009888" value="0x0A382080" />
+        <register type="NOA" address="0x00009888" value="0x0E38404C" />
+        <register type="NOA" address="0x00009888" value="0x0238404B" />
+        <register type="NOA" address="0x00009888" value="0x00384000" />
+        <register type="NOA" address="0x00009888" value="0x16380000" />
+        <register type="NOA" address="0x00009888" value="0x18381145" />
+        <register type="NOA" address="0x00009888" value="0x04380000" />
+        <register type="NOA" address="0x00009888" value="0x0039A000" />
+        <register type="NOA" address="0x00009888" value="0x06398000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0C39A000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x02392000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x238B02A0" />
+        <register type="NOA" address="0x00009888" value="0x258B5550" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x1F850A80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA0" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x03844000" />
+        <register type="NOA" address="0x00009888" value="0x17808137" />
+        <register type="NOA" address="0x00009888" value="0x1980C147" />
+        <register type="NOA" address="0x00009888" value="0x1B80C0E5" />
+        <register type="NOA" address="0x00009888" value="0x1D80C0E3" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x13804000" />
+        <register type="NOA" address="0x00009888" value="0x15800000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D801000" />
+        <register type="NOA" address="0x00009888" value="0x4F800111" />
+        <register type="NOA" address="0x00009888" value="0x43800062" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800062" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800062" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F801062" />
+        <register type="NOA" address="0x00009888" value="0x41801084" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SliceMask 0x02 AND"
+                     priority="2"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x10DC00E0" />
+        <register type="NOA" address="0x00009888" value="0x10D800E0" />
+        <register type="NOA" address="0x00009888" value="0x10B800E0" />
+        <register type="NOA" address="0x00009888" value="0x3580001A" />
+        <register type="NOA" address="0x00009888" value="0x3B800060" />
+        <register type="NOA" address="0x00009888" value="0x3D800005" />
+        <register type="NOA" address="0x00009888" value="0x06DC2100" />
+        <register type="NOA" address="0x00009888" value="0x0ADC0041" />
+        <register type="NOA" address="0x00009888" value="0x0CDC6600" />
+        <register type="NOA" address="0x00009888" value="0x00DC6580" />
+        <register type="NOA" address="0x00009888" value="0x08DC8000" />
+        <register type="NOA" address="0x00009888" value="0x0EDC8000" />
+        <register type="NOA" address="0x00009888" value="0x00D80042" />
+        <register type="NOA" address="0x00009888" value="0x08D82080" />
+        <register type="NOA" address="0x00009888" value="0x0CD8004C" />
+        <register type="NOA" address="0x00009888" value="0x0ED82580" />
+        <register type="NOA" address="0x00009888" value="0x00DB4000" />
+        <register type="NOA" address="0x00009888" value="0x18DB1000" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0104" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E9FAA00" />
+        <register type="NOA" address="0x00009888" value="0x109F02AA" />
+        <register type="NOA" address="0x00009888" value="0x08B80042" />
+        <register type="NOA" address="0x00009888" value="0x0AB82080" />
+        <register type="NOA" address="0x00009888" value="0x0EB8404C" />
+        <register type="NOA" address="0x00009888" value="0x02B8404B" />
+        <register type="NOA" address="0x00009888" value="0x00B84000" />
+        <register type="NOA" address="0x00009888" value="0x16B80000" />
+        <register type="NOA" address="0x00009888" value="0x18B81145" />
+        <register type="NOA" address="0x00009888" value="0x04B80000" />
+        <register type="NOA" address="0x00009888" value="0x00B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06B98000" />
+        <register type="NOA" address="0x00009888" value="0x08B9A000" />
+        <register type="NOA" address="0x00009888" value="0x0AB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0CB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x02B92000" />
+        <register type="NOA" address="0x00009888" value="0x01888000" />
+        <register type="NOA" address="0x00009888" value="0x0D88F800" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x238B0540" />
+        <register type="NOA" address="0x00009888" value="0x258BAAA0" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x018C4000" />
+        <register type="NOA" address="0x00009888" value="0x0F8C4000" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C5500" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x018DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D8000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x038D2000" />
+        <register type="NOA" address="0x00009888" value="0x1F850A80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA0" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x03844000" />
+        <register type="NOA" address="0x00009888" value="0x17808137" />
+        <register type="NOA" address="0x00009888" value="0x1980C147" />
+        <register type="NOA" address="0x00009888" value="0x1B80C0E5" />
+        <register type="NOA" address="0x00009888" value="0x1D80C0E3" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x13804000" />
+        <register type="NOA" address="0x00009888" value="0x15800000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D805000" />
+        <register type="NOA" address="0x00009888" value="0x4F800555" />
+        <register type="NOA" address="0x00009888" value="0x43800062" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800062" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800062" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800062" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="233d0544-fff7-4281-8291-e02f222aff72"
+       chipset="BDW"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull stall pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages send to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x0A1E0000" />
+        <register type="NOA" address="0x00009888" value="0x0C1F000F" />
+        <register type="NOA" address="0x00009888" value="0x10176800" />
+        <register type="NOA" address="0x00009888" value="0x1191001F" />
+        <register type="NOA" address="0x00009888" value="0x0B880320" />
+        <register type="NOA" address="0x00009888" value="0x01890C40" />
+        <register type="NOA" address="0x00009888" value="0x118A1C00" />
+        <register type="NOA" address="0x00009888" value="0x118D7C00" />
+        <register type="NOA" address="0x00009888" value="0x118E0020" />
+        <register type="NOA" address="0x00009888" value="0x118F4C00" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x13900001" />
+        <register type="NOA" address="0x00009888" value="0x065C4000" />
+        <register type="NOA" address="0x00009888" value="0x0C3D8000" />
+        <register type="NOA" address="0x00009888" value="0x06584000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B4000" />
+        <register type="NOA" address="0x00009888" value="0x081E0040" />
+        <register type="NOA" address="0x00009888" value="0x0E1E0000" />
+        <register type="NOA" address="0x00009888" value="0x021F5400" />
+        <register type="NOA" address="0x00009888" value="0x001F0000" />
+        <register type="NOA" address="0x00009888" value="0x101F0010" />
+        <register type="NOA" address="0x00009888" value="0x0E1F0080" />
+        <register type="NOA" address="0x00009888" value="0x0C384000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x0C13C000" />
+        <register type="NOA" address="0x00009888" value="0x06164000" />
+        <register type="NOA" address="0x00009888" value="0x06170012" />
+        <register type="NOA" address="0x00009888" value="0x00170000" />
+        <register type="NOA" address="0x00009888" value="0x01910005" />
+        <register type="NOA" address="0x00009888" value="0x07880002" />
+        <register type="NOA" address="0x00009888" value="0x01880C00" />
+        <register type="NOA" address="0x00009888" value="0x0F880000" />
+        <register type="NOA" address="0x00009888" value="0x0D880000" />
+        <register type="NOA" address="0x00009888" value="0x05880000" />
+        <register type="NOA" address="0x00009888" value="0x09890032" />
+        <register type="NOA" address="0x00009888" value="0x078A0800" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0A00" />
+        <register type="NOA" address="0x00009888" value="0x198A4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A2000" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x038A4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x238B54C0" />
+        <register type="NOA" address="0x00009888" value="0x258BAA55" />
+        <register type="NOA" address="0x00009888" value="0x278B0019" />
+        <register type="NOA" address="0x00009888" value="0x198C0100" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x0F8D0015" />
+        <register type="NOA" address="0x00009888" value="0x018D1000" />
+        <register type="NOA" address="0x00009888" value="0x098D8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DF000" />
+        <register type="NOA" address="0x00009888" value="0x0D8D3000" />
+        <register type="NOA" address="0x00009888" value="0x038DE000" />
+        <register type="NOA" address="0x00009888" value="0x058D3000" />
+        <register type="NOA" address="0x00009888" value="0x0D8E0004" />
+        <register type="NOA" address="0x00009888" value="0x058E000C" />
+        <register type="NOA" address="0x00009888" value="0x098E0000" />
+        <register type="NOA" address="0x00009888" value="0x078E0000" />
+        <register type="NOA" address="0x00009888" value="0x038E0000" />
+        <register type="NOA" address="0x00009888" value="0x0B8F0020" />
+        <register type="NOA" address="0x00009888" value="0x198F0C00" />
+        <register type="NOA" address="0x00009888" value="0x078F8000" />
+        <register type="NOA" address="0x00009888" value="0x098F4000" />
+        <register type="NOA" address="0x00009888" value="0x0B900980" />
+        <register type="NOA" address="0x00009888" value="0x03900D80" />
+        <register type="NOA" address="0x00009888" value="0x01900000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D801111" />
+        <register type="NOA" address="0x00009888" value="0x3D800800" />
+        <register type="NOA" address="0x00009888" value="0x4F801011" />
+        <register type="NOA" address="0x00009888" value="0x43800443" />
+        <register type="NOA" address="0x00009888" value="0x51801111" />
+        <register type="NOA" address="0x00009888" value="0x45800422" />
+        <register type="NOA" address="0x00009888" value="0x53801111" />
+        <register type="NOA" address="0x00009888" value="0x47800C60" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800422" />
+        <register type="NOA" address="0x00009888" value="0x41800021" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen8"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="2b255d48-2117-4fef-a8f7-f151e1d25a2c"
+       chipset="BDW"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x198B0343" />
+        <register type="NOA" address="0x00009888" value="0x13845800" />
+        <register type="NOA" address="0x00009888" value="0x15840018" />
+        <register type="NOA" address="0x00009888" value="0x3580001A" />
+        <register type="NOA" address="0x00009888" value="0x038B6300" />
+        <register type="NOA" address="0x00009888" value="0x058B6B62" />
+        <register type="NOA" address="0x00009888" value="0x078B006A" />
+        <register type="NOA" address="0x00009888" value="0x118B0000" />
+        <register type="NOA" address="0x00009888" value="0x238B0000" />
+        <register type="NOA" address="0x00009888" value="0x258B0000" />
+        <register type="NOA" address="0x00009888" value="0x1F85A080" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385000A" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x01840018" />
+        <register type="NOA" address="0x00009888" value="0x07844C80" />
+        <register type="NOA" address="0x00009888" value="0x09840D9A" />
+        <register type="NOA" address="0x00009888" value="0x0B840E9C" />
+        <register type="NOA" address="0x00009888" value="0x0D840F9E" />
+        <register type="NOA" address="0x00009888" value="0x0F840010" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x03848000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x2F8000E5" />
+        <register type="NOA" address="0x00009888" value="0x138080E3" />
+        <register type="NOA" address="0x00009888" value="0x1580C0E1" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x11804000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F804000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800800" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800842" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800842" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47801042" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800084" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen8"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="f7fd3220-b466-4a4d-9f98-b0caf3f2394c"
+       chipset="BDW"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x198B0343" />
+        <register type="NOA" address="0x00009888" value="0x13845400" />
+        <register type="NOA" address="0x00009888" value="0x3580001A" />
+        <register type="NOA" address="0x00009888" value="0x3D800805" />
+        <register type="NOA" address="0x00009888" value="0x038B6300" />
+        <register type="NOA" address="0x00009888" value="0x058B6B62" />
+        <register type="NOA" address="0x00009888" value="0x078B006A" />
+        <register type="NOA" address="0x00009888" value="0x118B0000" />
+        <register type="NOA" address="0x00009888" value="0x238B0000" />
+        <register type="NOA" address="0x00009888" value="0x258B0000" />
+        <register type="NOA" address="0x00009888" value="0x1F85A080" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x23850002" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x01840010" />
+        <register type="NOA" address="0x00009888" value="0x07844880" />
+        <register type="NOA" address="0x00009888" value="0x09840992" />
+        <register type="NOA" address="0x00009888" value="0x0B840A94" />
+        <register type="NOA" address="0x00009888" value="0x0D840B96" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x03848000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x2D800147" />
+        <register type="NOA" address="0x00009888" value="0x2F8000E5" />
+        <register type="NOA" address="0x00009888" value="0x138080E3" />
+        <register type="NOA" address="0x00009888" value="0x1580C0E1" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x11804000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F800000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800842" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800842" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47801082" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800084" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen8"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="e99ccaca-821c-4df9-97a7-96bdb7204e43"
+       chipset="BDW"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="Ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu atomic requests to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="Ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu requests to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="Ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu requests to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="Ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu requests to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="Ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu requests to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x01 AND"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x143D0160" />
+        <register type="NOA" address="0x00009888" value="0x163D2800" />
+        <register type="NOA" address="0x00009888" value="0x183D0120" />
+        <register type="NOA" address="0x00009888" value="0x105800E0" />
+        <register type="NOA" address="0x00009888" value="0x005CC000" />
+        <register type="NOA" address="0x00009888" value="0x065C8000" />
+        <register type="NOA" address="0x00009888" value="0x085CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0E5CC000" />
+        <register type="NOA" address="0x00009888" value="0x025CC000" />
+        <register type="NOA" address="0x00009888" value="0x045CC000" />
+        <register type="NOA" address="0x00009888" value="0x003D0011" />
+        <register type="NOA" address="0x00009888" value="0x063D0900" />
+        <register type="NOA" address="0x00009888" value="0x083D0A13" />
+        <register type="NOA" address="0x00009888" value="0x0A3D0B15" />
+        <register type="NOA" address="0x00009888" value="0x0C3D2317" />
+        <register type="NOA" address="0x00009888" value="0x043D21B7" />
+        <register type="NOA" address="0x00009888" value="0x103D0000" />
+        <register type="NOA" address="0x00009888" value="0x0E3D0000" />
+        <register type="NOA" address="0x00009888" value="0x1A3D0000" />
+        <register type="NOA" address="0x00009888" value="0x0E5825C1" />
+        <register type="NOA" address="0x00009888" value="0x00586100" />
+        <register type="NOA" address="0x00009888" value="0x0258204C" />
+        <register type="NOA" address="0x00009888" value="0x06588000" />
+        <register type="NOA" address="0x00009888" value="0x0858C000" />
+        <register type="NOA" address="0x00009888" value="0x0A58C000" />
+        <register type="NOA" address="0x00009888" value="0x0C58C000" />
+        <register type="NOA" address="0x00009888" value="0x0458C000" />
+        <register type="NOA" address="0x00009888" value="0x005B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x185B5400" />
+        <register type="NOA" address="0x00009888" value="0x1A5B0155" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B4000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAA2A" />
+        <register type="NOA" address="0x00009888" value="0x101F02AA" />
+        <register type="NOA" address="0x00009888" value="0x00384000" />
+        <register type="NOA" address="0x00009888" value="0x0E384000" />
+        <register type="NOA" address="0x00009888" value="0x16384000" />
+        <register type="NOA" address="0x00009888" value="0x18381555" />
+        <register type="NOA" address="0x00009888" value="0x02384000" />
+        <register type="NOA" address="0x00009888" value="0x04384000" />
+        <register type="NOA" address="0x00009888" value="0x06384000" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0039A000" />
+        <register type="NOA" address="0x00009888" value="0x06398000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0C39A000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x238B2AA0" />
+        <register type="NOA" address="0x00009888" value="0x258B5551" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA2" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800420" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800421" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x02 AND"
+                     priority="2"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x105C00E0" />
+        <register type="NOA" address="0x00009888" value="0x145B0160" />
+        <register type="NOA" address="0x00009888" value="0x165B2800" />
+        <register type="NOA" address="0x00009888" value="0x185B0120" />
+        <register type="NOA" address="0x00009888" value="0x0E5C25C1" />
+        <register type="NOA" address="0x00009888" value="0x005C6100" />
+        <register type="NOA" address="0x00009888" value="0x025C204C" />
+        <register type="NOA" address="0x00009888" value="0x065C8000" />
+        <register type="NOA" address="0x00009888" value="0x085CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5CC000" />
+        <register type="NOA" address="0x00009888" value="0x045CC000" />
+        <register type="NOA" address="0x00009888" value="0x005B0011" />
+        <register type="NOA" address="0x00009888" value="0x065B0900" />
+        <register type="NOA" address="0x00009888" value="0x085B0A13" />
+        <register type="NOA" address="0x00009888" value="0x0A5B0B15" />
+        <register type="NOA" address="0x00009888" value="0x0C5B2317" />
+        <register type="NOA" address="0x00009888" value="0x045B21B7" />
+        <register type="NOA" address="0x00009888" value="0x105B0000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B0000" />
+        <register type="NOA" address="0x00009888" value="0x1A5B0000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAA2A" />
+        <register type="NOA" address="0x00009888" value="0x101F02AA" />
+        <register type="NOA" address="0x00009888" value="0x00384000" />
+        <register type="NOA" address="0x00009888" value="0x0E384000" />
+        <register type="NOA" address="0x00009888" value="0x16384000" />
+        <register type="NOA" address="0x00009888" value="0x18381555" />
+        <register type="NOA" address="0x00009888" value="0x02384000" />
+        <register type="NOA" address="0x00009888" value="0x04384000" />
+        <register type="NOA" address="0x00009888" value="0x06384000" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0039A000" />
+        <register type="NOA" address="0x00009888" value="0x06398000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0C39A000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x238B2AA0" />
+        <register type="NOA" address="0x00009888" value="0x258B5551" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA2" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800420" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800421" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x04 AND"
+                     priority="4"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x103800E0" />
+        <register type="NOA" address="0x00009888" value="0x143A0160" />
+        <register type="NOA" address="0x00009888" value="0x163A2800" />
+        <register type="NOA" address="0x00009888" value="0x183A0120" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAA2A" />
+        <register type="NOA" address="0x00009888" value="0x101F02AA" />
+        <register type="NOA" address="0x00009888" value="0x0E38A5C1" />
+        <register type="NOA" address="0x00009888" value="0x0038A100" />
+        <register type="NOA" address="0x00009888" value="0x0238204C" />
+        <register type="NOA" address="0x00009888" value="0x16388000" />
+        <register type="NOA" address="0x00009888" value="0x183802AA" />
+        <register type="NOA" address="0x00009888" value="0x04380000" />
+        <register type="NOA" address="0x00009888" value="0x06380000" />
+        <register type="NOA" address="0x00009888" value="0x08388000" />
+        <register type="NOA" address="0x00009888" value="0x0A388000" />
+        <register type="NOA" address="0x00009888" value="0x0039A000" />
+        <register type="NOA" address="0x00009888" value="0x06398000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0C39A000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x003A0011" />
+        <register type="NOA" address="0x00009888" value="0x063A0900" />
+        <register type="NOA" address="0x00009888" value="0x083A0A13" />
+        <register type="NOA" address="0x00009888" value="0x0A3A0B15" />
+        <register type="NOA" address="0x00009888" value="0x0C3A2317" />
+        <register type="NOA" address="0x00009888" value="0x043A21B7" />
+        <register type="NOA" address="0x00009888" value="0x103A0000" />
+        <register type="NOA" address="0x00009888" value="0x0E3A0000" />
+        <register type="NOA" address="0x00009888" value="0x1A3A0000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x238B2AA0" />
+        <register type="NOA" address="0x00009888" value="0x258B5551" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA2" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800420" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800421" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x08 AND"
+                     priority="1"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x14BD0160" />
+        <register type="NOA" address="0x00009888" value="0x16BD2800" />
+        <register type="NOA" address="0x00009888" value="0x18BD0120" />
+        <register type="NOA" address="0x00009888" value="0x10D800E0" />
+        <register type="NOA" address="0x00009888" value="0x00DCC000" />
+        <register type="NOA" address="0x00009888" value="0x06DC8000" />
+        <register type="NOA" address="0x00009888" value="0x08DCC000" />
+        <register type="NOA" address="0x00009888" value="0x0ADCC000" />
+        <register type="NOA" address="0x00009888" value="0x0CDCC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDCC000" />
+        <register type="NOA" address="0x00009888" value="0x02DCC000" />
+        <register type="NOA" address="0x00009888" value="0x04DCC000" />
+        <register type="NOA" address="0x00009888" value="0x00BD0011" />
+        <register type="NOA" address="0x00009888" value="0x06BD0900" />
+        <register type="NOA" address="0x00009888" value="0x08BD0A13" />
+        <register type="NOA" address="0x00009888" value="0x0ABD0B15" />
+        <register type="NOA" address="0x00009888" value="0x0CBD2317" />
+        <register type="NOA" address="0x00009888" value="0x04BD21B7" />
+        <register type="NOA" address="0x00009888" value="0x10BD0000" />
+        <register type="NOA" address="0x00009888" value="0x0EBD0000" />
+        <register type="NOA" address="0x00009888" value="0x1ABD0000" />
+        <register type="NOA" address="0x00009888" value="0x0ED825C1" />
+        <register type="NOA" address="0x00009888" value="0x00D86100" />
+        <register type="NOA" address="0x00009888" value="0x02D8204C" />
+        <register type="NOA" address="0x00009888" value="0x06D88000" />
+        <register type="NOA" address="0x00009888" value="0x08D8C000" />
+        <register type="NOA" address="0x00009888" value="0x0AD8C000" />
+        <register type="NOA" address="0x00009888" value="0x0CD8C000" />
+        <register type="NOA" address="0x00009888" value="0x04D8C000" />
+        <register type="NOA" address="0x00009888" value="0x00DB4000" />
+        <register type="NOA" address="0x00009888" value="0x0EDB4000" />
+        <register type="NOA" address="0x00009888" value="0x18DB5400" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0155" />
+        <register type="NOA" address="0x00009888" value="0x02DB4000" />
+        <register type="NOA" address="0x00009888" value="0x04DB4000" />
+        <register type="NOA" address="0x00009888" value="0x06DB4000" />
+        <register type="NOA" address="0x00009888" value="0x08DB4000" />
+        <register type="NOA" address="0x00009888" value="0x0ADB4000" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E9FAA2A" />
+        <register type="NOA" address="0x00009888" value="0x109F02AA" />
+        <register type="NOA" address="0x00009888" value="0x00B84000" />
+        <register type="NOA" address="0x00009888" value="0x0EB84000" />
+        <register type="NOA" address="0x00009888" value="0x16B84000" />
+        <register type="NOA" address="0x00009888" value="0x18B81555" />
+        <register type="NOA" address="0x00009888" value="0x02B84000" />
+        <register type="NOA" address="0x00009888" value="0x04B84000" />
+        <register type="NOA" address="0x00009888" value="0x06B84000" />
+        <register type="NOA" address="0x00009888" value="0x08B84000" />
+        <register type="NOA" address="0x00009888" value="0x0AB84000" />
+        <register type="NOA" address="0x00009888" value="0x00B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06B98000" />
+        <register type="NOA" address="0x00009888" value="0x08B9A000" />
+        <register type="NOA" address="0x00009888" value="0x0AB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0CB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x02B9A000" />
+        <register type="NOA" address="0x00009888" value="0x04B9A000" />
+        <register type="NOA" address="0x00009888" value="0x01888000" />
+        <register type="NOA" address="0x00009888" value="0x0D88F800" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x238B5540" />
+        <register type="NOA" address="0x00009888" value="0x258BAAA2" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x018C4000" />
+        <register type="NOA" address="0x00009888" value="0x0F8C4000" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C5500" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x018DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D8000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA2" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800420" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800421" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x10 AND"
+                     priority="3"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x10DC00E0" />
+        <register type="NOA" address="0x00009888" value="0x14DB0160" />
+        <register type="NOA" address="0x00009888" value="0x16DB2800" />
+        <register type="NOA" address="0x00009888" value="0x18DB0120" />
+        <register type="NOA" address="0x00009888" value="0x0EDC25C1" />
+        <register type="NOA" address="0x00009888" value="0x00DC6100" />
+        <register type="NOA" address="0x00009888" value="0x02DC204C" />
+        <register type="NOA" address="0x00009888" value="0x06DC8000" />
+        <register type="NOA" address="0x00009888" value="0x08DCC000" />
+        <register type="NOA" address="0x00009888" value="0x0ADCC000" />
+        <register type="NOA" address="0x00009888" value="0x0CDCC000" />
+        <register type="NOA" address="0x00009888" value="0x04DCC000" />
+        <register type="NOA" address="0x00009888" value="0x00DB0011" />
+        <register type="NOA" address="0x00009888" value="0x06DB0900" />
+        <register type="NOA" address="0x00009888" value="0x08DB0A13" />
+        <register type="NOA" address="0x00009888" value="0x0ADB0B15" />
+        <register type="NOA" address="0x00009888" value="0x0CDB2317" />
+        <register type="NOA" address="0x00009888" value="0x04DB21B7" />
+        <register type="NOA" address="0x00009888" value="0x10DB0000" />
+        <register type="NOA" address="0x00009888" value="0x0EDB0000" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0000" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E9FAA2A" />
+        <register type="NOA" address="0x00009888" value="0x109F02AA" />
+        <register type="NOA" address="0x00009888" value="0x00B84000" />
+        <register type="NOA" address="0x00009888" value="0x0EB84000" />
+        <register type="NOA" address="0x00009888" value="0x16B84000" />
+        <register type="NOA" address="0x00009888" value="0x18B81555" />
+        <register type="NOA" address="0x00009888" value="0x02B84000" />
+        <register type="NOA" address="0x00009888" value="0x04B84000" />
+        <register type="NOA" address="0x00009888" value="0x06B84000" />
+        <register type="NOA" address="0x00009888" value="0x08B84000" />
+        <register type="NOA" address="0x00009888" value="0x0AB84000" />
+        <register type="NOA" address="0x00009888" value="0x00B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06B98000" />
+        <register type="NOA" address="0x00009888" value="0x08B9A000" />
+        <register type="NOA" address="0x00009888" value="0x0AB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0CB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x02B9A000" />
+        <register type="NOA" address="0x00009888" value="0x04B9A000" />
+        <register type="NOA" address="0x00009888" value="0x01888000" />
+        <register type="NOA" address="0x00009888" value="0x0D88F800" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x238B5540" />
+        <register type="NOA" address="0x00009888" value="0x258BAAA2" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x018C4000" />
+        <register type="NOA" address="0x00009888" value="0x0F8C4000" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C5500" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x018DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D8000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA2" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800420" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800421" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x20 AND"
+                     priority="5"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x10B800E0" />
+        <register type="NOA" address="0x00009888" value="0x14BA0160" />
+        <register type="NOA" address="0x00009888" value="0x16BA2800" />
+        <register type="NOA" address="0x00009888" value="0x18BA0120" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E9FAA2A" />
+        <register type="NOA" address="0x00009888" value="0x109F02AA" />
+        <register type="NOA" address="0x00009888" value="0x0EB8A5C1" />
+        <register type="NOA" address="0x00009888" value="0x00B8A100" />
+        <register type="NOA" address="0x00009888" value="0x02B8204C" />
+        <register type="NOA" address="0x00009888" value="0x16B88000" />
+        <register type="NOA" address="0x00009888" value="0x18B802AA" />
+        <register type="NOA" address="0x00009888" value="0x04B80000" />
+        <register type="NOA" address="0x00009888" value="0x06B80000" />
+        <register type="NOA" address="0x00009888" value="0x08B88000" />
+        <register type="NOA" address="0x00009888" value="0x0AB88000" />
+        <register type="NOA" address="0x00009888" value="0x00B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06B98000" />
+        <register type="NOA" address="0x00009888" value="0x08B9A000" />
+        <register type="NOA" address="0x00009888" value="0x0AB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0CB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x02B9A000" />
+        <register type="NOA" address="0x00009888" value="0x04B9A000" />
+        <register type="NOA" address="0x00009888" value="0x00BA0011" />
+        <register type="NOA" address="0x00009888" value="0x06BA0900" />
+        <register type="NOA" address="0x00009888" value="0x08BA0A13" />
+        <register type="NOA" address="0x00009888" value="0x0ABA0B15" />
+        <register type="NOA" address="0x00009888" value="0x0CBA2317" />
+        <register type="NOA" address="0x00009888" value="0x04BA21B7" />
+        <register type="NOA" address="0x00009888" value="0x10BA0000" />
+        <register type="NOA" address="0x00009888" value="0x0EBA0000" />
+        <register type="NOA" address="0x00009888" value="0x1ABA0000" />
+        <register type="NOA" address="0x00009888" value="0x01888000" />
+        <register type="NOA" address="0x00009888" value="0x0D88F800" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x238B5540" />
+        <register type="NOA" address="0x00009888" value="0x258BAAA2" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x018C4000" />
+        <register type="NOA" address="0x00009888" value="0x0F8C4000" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C5500" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x018DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D8000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA2" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800420" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800421" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen8"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="27a364dc-8225-4ecb-b607-d6f1925598d9"
+       chipset="BDW"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ C 2 READ C 3 READ B 6 READ B 7 READ UADD UADD UADD UADD UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OCL OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OCL OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="L3 Bank 10 Accesses"
+             description="The total number of accesses to L3 Bank 10."
+             data_type="uint64"
+             equation="C 2 READ 2 UMUL"
+             underscore_name="l3_bank10_accesses"
+             units="messages"
+             symbol_name="L3Bank10Accesses"
+             availability="$SliceMask 0x02 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 10 IC Accesses"
+             description="The total number of accesses to L3 Bank 10 from IC cache."
+             data_type="uint64"
+             equation="B 4 READ B 5 READ UADD 2 UMUL $L3Bank10Accesses UMIN"
+             underscore_name="l3_bank10_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank10IcAccesses"
+             availability="$SliceMask 0x02 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 10 IC Hits"
+             description="The total number of hits in L3 Bank 10 from IC cache."
+             data_type="uint64"
+             equation="B 5 READ 2 UMUL $L3Bank10IcAccesses UMIN"
+             underscore_name="l3_bank10_ic_hits"
+             units="messages"
+             symbol_name="L3Bank10IcHits"
+             availability="$SliceMask 0x02 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 11 Accesses"
+             description="The total number of accesses to L3 Bank 11."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="l3_bank11_accesses"
+             units="messages"
+             symbol_name="L3Bank11Accesses"
+             availability="$SliceMask 0x02 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Bank 13 Accesses"
+             description="The total number of accesses to L3 Bank 13."
+             data_type="uint64"
+             equation="B 7 READ 2 UMUL"
+             underscore_name="l3_bank13_accesses"
+             units="messages"
+             symbol_name="L3Bank13Accesses"
+             availability="$SliceMask 0x02 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="L3 Bank 12 Accesses"
+             description="The total number of accesses to L3 Bank 12."
+             data_type="uint64"
+             equation="B 6 READ 2 UMUL"
+             underscore_name="l3_bank12_accesses"
+             units="messages"
+             symbol_name="L3Bank12Accesses"
+             availability="$SliceMask 0x02 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x143F00B3" />
+        <register type="NOA" address="0x00009888" value="0x14BF00B3" />
+        <register type="NOA" address="0x00009888" value="0x138303C0" />
+        <register type="NOA" address="0x00009888" value="0x3B800060" />
+        <register type="NOA" address="0x00009888" value="0x3D800805" />
+        <register type="NOA" address="0x00009888" value="0x003F0029" />
+        <register type="NOA" address="0x00009888" value="0x063F1400" />
+        <register type="NOA" address="0x00009888" value="0x083F1225" />
+        <register type="NOA" address="0x00009888" value="0x0E3F1327" />
+        <register type="NOA" address="0x00009888" value="0x103F0000" />
+        <register type="NOA" address="0x00009888" value="0x005A4000" />
+        <register type="NOA" address="0x00009888" value="0x065A8000" />
+        <register type="NOA" address="0x00009888" value="0x085AC000" />
+        <register type="NOA" address="0x00009888" value="0x0E5AC000" />
+        <register type="NOA" address="0x00009888" value="0x001D4000" />
+        <register type="NOA" address="0x00009888" value="0x061D8000" />
+        <register type="NOA" address="0x00009888" value="0x081DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1DC000" />
+        <register type="NOA" address="0x00009888" value="0x0C1F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E1F2A00" />
+        <register type="NOA" address="0x00009888" value="0x101F0280" />
+        <register type="NOA" address="0x00009888" value="0x00391000" />
+        <register type="NOA" address="0x00009888" value="0x06394000" />
+        <register type="NOA" address="0x00009888" value="0x08395000" />
+        <register type="NOA" address="0x00009888" value="0x0E395000" />
+        <register type="NOA" address="0x00009888" value="0x0ABF1429" />
+        <register type="NOA" address="0x00009888" value="0x0CBF1225" />
+        <register type="NOA" address="0x00009888" value="0x00BF1380" />
+        <register type="NOA" address="0x00009888" value="0x02BF0026" />
+        <register type="NOA" address="0x00009888" value="0x10BF0000" />
+        <register type="NOA" address="0x00009888" value="0x0ADAC000" />
+        <register type="NOA" address="0x00009888" value="0x0CDAC000" />
+        <register type="NOA" address="0x00009888" value="0x00DA8000" />
+        <register type="NOA" address="0x00009888" value="0x02DA4000" />
+        <register type="NOA" address="0x00009888" value="0x0A9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0C9DC000" />
+        <register type="NOA" address="0x00009888" value="0x009D8000" />
+        <register type="NOA" address="0x00009888" value="0x029D4000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F8000" />
+        <register type="NOA" address="0x00009888" value="0x109F002A" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA000" />
+        <register type="NOA" address="0x00009888" value="0x0AB95000" />
+        <register type="NOA" address="0x00009888" value="0x0CB95000" />
+        <register type="NOA" address="0x00009888" value="0x00B94000" />
+        <register type="NOA" address="0x00009888" value="0x02B91000" />
+        <register type="NOA" address="0x00009888" value="0x0D88C000" />
+        <register type="NOA" address="0x00009888" value="0x0F880003" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A8020" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x238B0520" />
+        <register type="NOA" address="0x00009888" value="0x258BA950" />
+        <register type="NOA" address="0x00009888" value="0x278B0016" />
+        <register type="NOA" address="0x00009888" value="0x198C5400" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0001" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x018D8000" />
+        <register type="NOA" address="0x00009888" value="0x038D2000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA0" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x03835180" />
+        <register type="NOA" address="0x00009888" value="0x05834022" />
+        <register type="NOA" address="0x00009888" value="0x11830000" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x07830000" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x05844000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C137" />
+        <register type="NOA" address="0x00009888" value="0x1D80C147" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x15804000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D801000" />
+        <register type="NOA" address="0x00009888" value="0x4F800111" />
+        <register type="NOA" address="0x00009888" value="0x43800842" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800840" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800800" />
+        <register type="NOA" address="0x00009888" value="0x418014A2" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Data Port Reads Coalescing Gen8"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="data_port_reads_coalescing"
+       hw_config_guid="857fc630-2f09-4804-85f1-084adfadd5ab"
+       chipset="BDW"
+       symbol_name="DataPortReadsCoalescing"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU to Data Port 0 Reads 64"
+             description="The subslice 0 EU data reads from Data Port with 64B per message."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_hdc0_reads64_b"
+             units="messages"
+             symbol_name="EuHdc0Reads64B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Data Port 0 to L3 Data Reads"
+             description="The subslice 0 Data Port data and constant reads from L3 cache."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="hdc0_l3_data_reads"
+             units="messages"
+             symbol_name="Hdc0L3DataReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Data Port 0 to L3 Data Writes"
+             description="The subslice 0 Data Port data writes to L3 cache."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="hdc0_l3_data_writes"
+             units="messages"
+             symbol_name="Hdc0L3DataWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU to Data Port 0 Reads 128"
+             description="The subslice 0 EU data reads from Data Port with 128B per message."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_hdc0_reads128_b"
+             units="messages"
+             symbol_name="EuHdc0Reads128B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="All Data Port 0 Writes to L3"
+             description="The subslice 0 Data Port writes to L3 cache."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="hdc0_l3_writes"
+             units="messages"
+             symbol_name="Hdc0L3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU to Data Port 0 Reads 32"
+             description="The subslice 0 EU data reads from Data Port with 32B per message."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_hdc0_reads32_b"
+             units="messages"
+             symbol_name="EuHdc0Reads32B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU to Data Port 0 Reads 256"
+             description="The subslice 0 EU data reads from Data Port with 256B per message."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_hdc0_reads256_b"
+             units="messages"
+             symbol_name="EuHdc0Reads256B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuBytesReadPerCacheLine"
+             description="Average EU bytes read per L3 cache line."
+             data_type="float"
+             equation="$EuHdc0Reads32B 32 UMUL $EuHdc0Reads64B 64 UMUL $EuHdc0Reads128B 128 UMUL $EuHdc0Reads256B 256 UMUL UADD UADD UADD $Hdc0L3DataReads FDIV"
+             underscore_name="eu_bytes_read_per_cache_line"
+             units="eu bytes per l3 cache line"
+             symbol_name="EuBytesReadPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuDataReadsPerCacheLine"
+             description="Coalescing ratio of EU read requests to L3 cache lines."
+             data_type="float"
+             equation="$EuBytesReadPerCacheLine 64 FDIV"
+             underscore_name="eu_data_reads_per_cache_line"
+             units="utilization"
+             symbol_name="EuDataReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="All Data Port 0 Reads from L3"
+             description="The subslice 0 Data Port reads from L3 cache."
+             data_type="uint64"
+             equation="C 3 READ C 2 READ USUB"
+             underscore_name="hdc0_l3_reads"
+             units="messages"
+             symbol_name="Hdc0L3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x01 AND"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x103D0005" />
+        <register type="NOA" address="0x00009888" value="0x163D240B" />
+        <register type="NOA" address="0x00009888" value="0x1058022F" />
+        <register type="NOA" address="0x00009888" value="0x185B5520" />
+        <register type="NOA" address="0x00009888" value="0x198B0003" />
+        <register type="NOA" address="0x00009888" value="0x005CC000" />
+        <register type="NOA" address="0x00009888" value="0x065CC000" />
+        <register type="NOA" address="0x00009888" value="0x085CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0E5CC000" />
+        <register type="NOA" address="0x00009888" value="0x025C4000" />
+        <register type="NOA" address="0x00009888" value="0x045C8000" />
+        <register type="NOA" address="0x00009888" value="0x003D0000" />
+        <register type="NOA" address="0x00009888" value="0x063D00B0" />
+        <register type="NOA" address="0x00009888" value="0x083D0182" />
+        <register type="NOA" address="0x00009888" value="0x0A3D10A0" />
+        <register type="NOA" address="0x00009888" value="0x0C3D11A2" />
+        <register type="NOA" address="0x00009888" value="0x0E3D0000" />
+        <register type="NOA" address="0x00009888" value="0x183D0000" />
+        <register type="NOA" address="0x00009888" value="0x1A3D0000" />
+        <register type="NOA" address="0x00009888" value="0x0E582242" />
+        <register type="NOA" address="0x00009888" value="0x00586700" />
+        <register type="NOA" address="0x00009888" value="0x0258004F" />
+        <register type="NOA" address="0x00009888" value="0x0658C000" />
+        <register type="NOA" address="0x00009888" value="0x0858C000" />
+        <register type="NOA" address="0x00009888" value="0x0A58C000" />
+        <register type="NOA" address="0x00009888" value="0x0C58C000" />
+        <register type="NOA" address="0x00009888" value="0x045B6300" />
+        <register type="NOA" address="0x00009888" value="0x105B0000" />
+        <register type="NOA" address="0x00009888" value="0x005B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5B0155" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B0000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B4000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAAA0" />
+        <register type="NOA" address="0x00009888" value="0x101F02AA" />
+        <register type="NOA" address="0x00009888" value="0x00384000" />
+        <register type="NOA" address="0x00009888" value="0x0E384000" />
+        <register type="NOA" address="0x00009888" value="0x16384000" />
+        <register type="NOA" address="0x00009888" value="0x18381555" />
+        <register type="NOA" address="0x00009888" value="0x02384000" />
+        <register type="NOA" address="0x00009888" value="0x04384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0C384000" />
+        <register type="NOA" address="0x00009888" value="0x0039A000" />
+        <register type="NOA" address="0x00009888" value="0x0639A000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0C39A000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x02392000" />
+        <register type="NOA" address="0x00009888" value="0x04398000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x038B6300" />
+        <register type="NOA" address="0x00009888" value="0x058B0062" />
+        <register type="NOA" address="0x00009888" value="0x118B0000" />
+        <register type="NOA" address="0x00009888" value="0x238B02A0" />
+        <register type="NOA" address="0x00009888" value="0x258B5555" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D801000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800001" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800420" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800421" />
+        <register type="NOA" address="0x00009888" value="0x41800041" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0xBA98BA98" />
+        <register type="OA" address="0x00002748" value="0xBA98BA98" />
+        <register type="OA" address="0x00002744" value="0x00003377" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFF2" />
+        <register type="OA" address="0x00002774" value="0x00007FF0" />
+        <register type="OA" address="0x00002778" value="0x0007FFE2" />
+        <register type="OA" address="0x0000277C" value="0x00007FF0" />
+        <register type="OA" address="0x00002780" value="0x0007FFC2" />
+        <register type="OA" address="0x00002784" value="0x00007FF0" />
+        <register type="OA" address="0x00002788" value="0x0007FF82" />
+        <register type="OA" address="0x0000278C" value="0x00007FF0" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000BFEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000BFDF" />
+        <register type="OA" address="0x000027A0" value="0x0007FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000BFBF" />
+        <register type="OA" address="0x000027A8" value="0x0007FFFA" />
+        <register type="OA" address="0x000027AC" value="0x0000BF7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Data Port Writes Coalescing Gen8"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="data_port_writes_coalescing"
+       hw_config_guid="343ebc99-4a55-414c-8c17-d8e259cf5e20"
+       chipset="BDW"
+       symbol_name="DataPortWritesCoalescing"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU to Data Port 0 Writes 128"
+             description="The subslice 0 EU data simd16 writes to Data Port with 192B per message."
+             data_type="uint64"
+             equation="B 6 READ 2 UDIV"
+             underscore_name="eu_hdc0_writes192_b"
+             units="messages"
+             symbol_name="EuHdc0Writes192B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="EU to Data Port 0 Writes 32B"
+             description="The subslice 0 EU data writes to Data Port with 32B per message."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_hdc0_writes32_b"
+             units="messages"
+             symbol_name="EuHdc0Writes32B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU to Data Port 0 Writes 256B"
+             description="The subslice 0 EU data simd16 writes to Data Port with 256B per message."
+             data_type="uint64"
+             equation="B 7 READ 2 UDIV"
+             underscore_name="eu_hdc0_writes256_b_simd16"
+             units="messages"
+             symbol_name="EuHdc0Writes256BSimd16"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Data Port 0 to L3 Data Reads"
+             description="The subslice 0 Data Port data and constant reads from L3 cache."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="hdc0_l3_data_reads"
+             units="messages"
+             symbol_name="Hdc0L3DataReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Data Port 0 to L3 Data Writes"
+             description="The subslice 0 Data Port data writes to L3 cache."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="hdc0_l3_data_writes"
+             units="messages"
+             symbol_name="Hdc0L3DataWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU to Data Port 0 Writes 64B"
+             description="The subslice 0 EU data simd16 writes to Data Port with 128B per message."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_hdc0_writes128_b_simd16"
+             units="messages"
+             symbol_name="EuHdc0Writes128BSimd16"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU to Data Port 0 Writes 64B"
+             description="The subslice 0 EU data writes to Data Port with 64B per message."
+             data_type="uint64"
+             equation="B 2 READ 2 UDIV"
+             underscore_name="eu_hdc0_writes96_b"
+             units="messages"
+             symbol_name="EuHdc0Writes96B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="All Data Port 0 Writes to L3"
+             description="The subslice 0 Data Port writes to L3 cache."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="hdc0_l3_writes"
+             units="messages"
+             symbol_name="Hdc0L3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU to Data Port 0 Writes 64B"
+             description="The subslice 0 EU data writes to Data Port with 64B per message."
+             data_type="uint64"
+             equation="B 1 READ B 4 READ UADD"
+             underscore_name="eu_hdc0_writes64_b"
+             units="messages"
+             symbol_name="EuHdc0Writes64B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU to Data Port 0 Writes 128"
+             description="The subslice 0 EU data writes to Data Port with 128B per message."
+             data_type="uint64"
+             equation="B 3 READ 2 UDIV"
+             underscore_name="eu_hdc0_writes128_b"
+             units="messages"
+             symbol_name="EuHdc0Writes128B"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuBytesWrittenPerCacheLine"
+             description="Average EU bytes written per L3 cache line."
+             data_type="float"
+             equation="$EuHdc0Writes32B 32 UMUL $EuHdc0Writes64B 64 UMUL $EuHdc0Writes96B 96 UMUL $EuHdc0Writes128B 128 UMUL $EuHdc0Writes128BSimd16 128 UMUL $EuHdc0Writes256BSimd16 256 UMUL $EuHdc0Writes192B 192 UMUL UADD UADD UADD UADD UADD UADD $Hdc0L3DataWrites FDIV"
+             underscore_name="eu_bytes_written_per_cache_line"
+             units="eu bytes per l3 cache line"
+             symbol_name="EuBytesWrittenPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuDataWritesPerCacheLine"
+             description="Coalescing ratio of EU write requests to L3 cache lines."
+             data_type="float"
+             equation="$EuBytesWrittenPerCacheLine 64 FDIV"
+             underscore_name="eu_data_writes_per_cache_line"
+             units="utilization"
+             symbol_name="EuDataWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL 2 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="All Data Port 0 Reads from L3"
+             description="The subslice 0 Data Port reads from L3 cache."
+             data_type="uint64"
+             equation="C 3 READ C 2 READ USUB"
+             underscore_name="hdc0_l3_reads"
+             units="messages"
+             symbol_name="Hdc0L3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x01 AND"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x103D0005" />
+        <register type="NOA" address="0x00009888" value="0x143D0120" />
+        <register type="NOA" address="0x00009888" value="0x163D2400" />
+        <register type="NOA" address="0x00009888" value="0x1058022F" />
+        <register type="NOA" address="0x00009888" value="0x105B0000" />
+        <register type="NOA" address="0x00009888" value="0x198B0003" />
+        <register type="NOA" address="0x00009888" value="0x005CC000" />
+        <register type="NOA" address="0x00009888" value="0x065CC000" />
+        <register type="NOA" address="0x00009888" value="0x085CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0E5CC000" />
+        <register type="NOA" address="0x00009888" value="0x025C4000" />
+        <register type="NOA" address="0x00009888" value="0x045C8000" />
+        <register type="NOA" address="0x00009888" value="0x003D0000" />
+        <register type="NOA" address="0x00009888" value="0x063D0094" />
+        <register type="NOA" address="0x00009888" value="0x083D0182" />
+        <register type="NOA" address="0x00009888" value="0x0A3D1814" />
+        <register type="NOA" address="0x00009888" value="0x0E3D0000" />
+        <register type="NOA" address="0x00009888" value="0x183D0000" />
+        <register type="NOA" address="0x00009888" value="0x1A3D0000" />
+        <register type="NOA" address="0x00009888" value="0x0C3D0000" />
+        <register type="NOA" address="0x00009888" value="0x0E582242" />
+        <register type="NOA" address="0x00009888" value="0x00586700" />
+        <register type="NOA" address="0x00009888" value="0x0258004F" />
+        <register type="NOA" address="0x00009888" value="0x0658C000" />
+        <register type="NOA" address="0x00009888" value="0x0858C000" />
+        <register type="NOA" address="0x00009888" value="0x0A58C000" />
+        <register type="NOA" address="0x00009888" value="0x045B6A80" />
+        <register type="NOA" address="0x00009888" value="0x005B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x185B5400" />
+        <register type="NOA" address="0x00009888" value="0x1A5B0141" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B0000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B4000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAAA0" />
+        <register type="NOA" address="0x00009888" value="0x101F0282" />
+        <register type="NOA" address="0x00009888" value="0x00384000" />
+        <register type="NOA" address="0x00009888" value="0x0E384000" />
+        <register type="NOA" address="0x00009888" value="0x16384000" />
+        <register type="NOA" address="0x00009888" value="0x18381415" />
+        <register type="NOA" address="0x00009888" value="0x02384000" />
+        <register type="NOA" address="0x00009888" value="0x04384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0C384000" />
+        <register type="NOA" address="0x00009888" value="0x0039A000" />
+        <register type="NOA" address="0x00009888" value="0x0639A000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x02392000" />
+        <register type="NOA" address="0x00009888" value="0x04398000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A82A0" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x038B6300" />
+        <register type="NOA" address="0x00009888" value="0x058B0062" />
+        <register type="NOA" address="0x00009888" value="0x118B0000" />
+        <register type="NOA" address="0x00009888" value="0x238B02A0" />
+        <register type="NOA" address="0x00009888" value="0x258B1555" />
+        <register type="NOA" address="0x00009888" value="0x278B0014" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x21852AAA" />
+        <register type="NOA" address="0x00009888" value="0x23850028" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830141" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00000D24" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x4D801000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800001" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800420" />
+        <register type="NOA" address="0x00009888" value="0x3F800421" />
+        <register type="NOA" address="0x00009888" value="0x41800041" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0xBA98BA98" />
+        <register type="OA" address="0x00002748" value="0xBA98BA98" />
+        <register type="OA" address="0x00002744" value="0x00003377" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FF72" />
+        <register type="OA" address="0x00002774" value="0x0000BFD0" />
+        <register type="OA" address="0x00002778" value="0x0007FF62" />
+        <register type="OA" address="0x0000277C" value="0x0000BFD0" />
+        <register type="OA" address="0x00002780" value="0x0007FF42" />
+        <register type="OA" address="0x00002784" value="0x0000BFD0" />
+        <register type="OA" address="0x00002788" value="0x0007FF02" />
+        <register type="OA" address="0x0000278C" value="0x0000BFD0" />
+        <register type="OA" address="0x00002790" value="0x0005FFF2" />
+        <register type="OA" address="0x00002794" value="0x0000BFD0" />
+        <register type="OA" address="0x00002798" value="0x0005FFE2" />
+        <register type="OA" address="0x0000279C" value="0x0000BFD0" />
+        <register type="OA" address="0x000027A0" value="0x0005FFC2" />
+        <register type="OA" address="0x000027A4" value="0x0000BFD0" />
+        <register type="OA" address="0x000027A8" value="0x0005FF82" />
+        <register type="OA" address="0x000027AC" value="0x0000BFD0" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="78490af2-10fa-430b-ae3c-94ec04d5214e"
+       chipset="BDW"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ C 0 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader12_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader12AccessStalledOnL3"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ B 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader10_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader10AccessStalledOnL3"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ B 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader11_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader11AccessStalledOnL3"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x105C0232" />
+        <register type="NOA" address="0x00009888" value="0x10580232" />
+        <register type="NOA" address="0x00009888" value="0x10380232" />
+        <register type="NOA" address="0x00009888" value="0x10DC0232" />
+        <register type="NOA" address="0x00009888" value="0x10D80232" />
+        <register type="NOA" address="0x00009888" value="0x10B80232" />
+        <register type="NOA" address="0x00009888" value="0x118E4400" />
+        <register type="NOA" address="0x00009888" value="0x025C6080" />
+        <register type="NOA" address="0x00009888" value="0x045C004B" />
+        <register type="NOA" address="0x00009888" value="0x005C8000" />
+        <register type="NOA" address="0x00009888" value="0x00582080" />
+        <register type="NOA" address="0x00009888" value="0x0258004B" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00AA" />
+        <register type="NOA" address="0x00009888" value="0x04386080" />
+        <register type="NOA" address="0x00009888" value="0x0638404B" />
+        <register type="NOA" address="0x00009888" value="0x02384000" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A380000" />
+        <register type="NOA" address="0x00009888" value="0x0C380000" />
+        <register type="NOA" address="0x00009888" value="0x00398000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x0CDC25C1" />
+        <register type="NOA" address="0x00009888" value="0x0ADCC000" />
+        <register type="NOA" address="0x00009888" value="0x0AD825C1" />
+        <register type="NOA" address="0x00009888" value="0x18DB4000" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0001" />
+        <register type="NOA" address="0x00009888" value="0x0E9F8000" />
+        <register type="NOA" address="0x00009888" value="0x109F02AA" />
+        <register type="NOA" address="0x00009888" value="0x0EB825C1" />
+        <register type="NOA" address="0x00009888" value="0x18B80154" />
+        <register type="NOA" address="0x00009888" value="0x0AB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0CB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0D88C000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258BAA05" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x198C5400" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x098DC000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x098E05C0" />
+        <register type="NOA" address="0x00009888" value="0x058E0000" />
+        <register type="NOA" address="0x00009888" value="0x198F0020" />
+        <register type="NOA" address="0x00009888" value="0x2185AA0A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x19835000" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x19808000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x51800040" />
+        <register type="NOA" address="0x00009888" value="0x43800400" />
+        <register type="NOA" address="0x00009888" value="0x45800800" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800C62" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F801042" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x418014A4" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FFF7" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="c0abdd97-3b13-4cad-814c-bd178804e02c"
+       chipset="BDW"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank1 Stalled"
+             description="The percentage of time in which slice1 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank1_stalled"
+             units="percent"
+             symbol_name="L31Bank1Stalled"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice1 L3 Bank0 Stalled"
+             description="The percentage of time in which slice1 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank0_stalled"
+             units="percent"
+             symbol_name="L31Bank0Stalled"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice1 L3 Bank1 Active"
+             description="The percentage of time in which slice1 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank1_active"
+             units="percent"
+             symbol_name="L31Bank1Active"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank0 Active"
+             description="The percentage of time in which slice1 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank0_active"
+             units="percent"
+             symbol_name="L31Bank0Active"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x10BF03DA" />
+        <register type="NOA" address="0x00009888" value="0x14BF0001" />
+        <register type="NOA" address="0x00009888" value="0x12980340" />
+        <register type="NOA" address="0x00009888" value="0x12990340" />
+        <register type="NOA" address="0x00009888" value="0x0CBF1187" />
+        <register type="NOA" address="0x00009888" value="0x0EBF1205" />
+        <register type="NOA" address="0x00009888" value="0x00BF0500" />
+        <register type="NOA" address="0x00009888" value="0x02BF042B" />
+        <register type="NOA" address="0x00009888" value="0x04BF002C" />
+        <register type="NOA" address="0x00009888" value="0x0CDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDAC000" />
+        <register type="NOA" address="0x00009888" value="0x00DA8000" />
+        <register type="NOA" address="0x00009888" value="0x02DAC000" />
+        <register type="NOA" address="0x00009888" value="0x04DA4000" />
+        <register type="NOA" address="0x00009888" value="0x04983400" />
+        <register type="NOA" address="0x00009888" value="0x10980000" />
+        <register type="NOA" address="0x00009888" value="0x06990034" />
+        <register type="NOA" address="0x00009888" value="0x10990000" />
+        <register type="NOA" address="0x00009888" value="0x0C9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E9DC000" />
+        <register type="NOA" address="0x00009888" value="0x009D8000" />
+        <register type="NOA" address="0x00009888" value="0x029DC000" />
+        <register type="NOA" address="0x00009888" value="0x049D4000" />
+        <register type="NOA" address="0x00009888" value="0x109F02A8" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F00BA" />
+        <register type="NOA" address="0x00009888" value="0x0CB88000" />
+        <register type="NOA" address="0x00009888" value="0x0CB95000" />
+        <register type="NOA" address="0x00009888" value="0x0EB95000" />
+        <register type="NOA" address="0x00009888" value="0x00B94000" />
+        <register type="NOA" address="0x00009888" value="0x02B95000" />
+        <register type="NOA" address="0x00009888" value="0x04B91000" />
+        <register type="NOA" address="0x00009888" value="0x06B92000" />
+        <register type="NOA" address="0x00009888" value="0x0CBA4000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x258B800A" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B5500" />
+        <register type="NOA" address="0x00009888" value="0x198C4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x018D8000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2185800A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x1B830154" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x47800000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800060" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="ad665281-a7cf-483a-bd10-0e07c43f61c7"
+       chipset="BDW"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x103F03DA" />
+        <register type="NOA" address="0x00009888" value="0x143F0001" />
+        <register type="NOA" address="0x00009888" value="0x12180340" />
+        <register type="NOA" address="0x00009888" value="0x12190340" />
+        <register type="NOA" address="0x00009888" value="0x0C3F1187" />
+        <register type="NOA" address="0x00009888" value="0x0E3F1205" />
+        <register type="NOA" address="0x00009888" value="0x003F0500" />
+        <register type="NOA" address="0x00009888" value="0x023F042B" />
+        <register type="NOA" address="0x00009888" value="0x043F002C" />
+        <register type="NOA" address="0x00009888" value="0x0C5AC000" />
+        <register type="NOA" address="0x00009888" value="0x0E5AC000" />
+        <register type="NOA" address="0x00009888" value="0x005A8000" />
+        <register type="NOA" address="0x00009888" value="0x025AC000" />
+        <register type="NOA" address="0x00009888" value="0x045A4000" />
+        <register type="NOA" address="0x00009888" value="0x04183400" />
+        <register type="NOA" address="0x00009888" value="0x10180000" />
+        <register type="NOA" address="0x00009888" value="0x06190034" />
+        <register type="NOA" address="0x00009888" value="0x10190000" />
+        <register type="NOA" address="0x00009888" value="0x0C1DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1DC000" />
+        <register type="NOA" address="0x00009888" value="0x001D8000" />
+        <register type="NOA" address="0x00009888" value="0x021DC000" />
+        <register type="NOA" address="0x00009888" value="0x041D4000" />
+        <register type="NOA" address="0x00009888" value="0x101F02A8" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00BA" />
+        <register type="NOA" address="0x00009888" value="0x0C388000" />
+        <register type="NOA" address="0x00009888" value="0x0C395000" />
+        <register type="NOA" address="0x00009888" value="0x0E395000" />
+        <register type="NOA" address="0x00009888" value="0x00394000" />
+        <register type="NOA" address="0x00009888" value="0x02395000" />
+        <register type="NOA" address="0x00009888" value="0x04391000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AA800" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258B4005" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x2185800A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x1B830154" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x47800000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800060" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="930a15aa-4300-4fce-a9ba-edb0b9e880be"
+       chipset="BDW"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank3 Active"
+             description="The percentage of time in which slice1 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank3_active"
+             units="percent"
+             symbol_name="L31Bank3Active"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice1 L3 Bank3 Stalled"
+             description="The percentage of time in which slice1 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank3_stalled"
+             units="percent"
+             symbol_name="L31Bank3Stalled"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x121B0340" />
+        <register type="NOA" address="0x00009888" value="0x103F0274" />
+        <register type="NOA" address="0x00009888" value="0x123F0000" />
+        <register type="NOA" address="0x00009888" value="0x129B0340" />
+        <register type="NOA" address="0x00009888" value="0x10BF0274" />
+        <register type="NOA" address="0x00009888" value="0x12BF0000" />
+        <register type="NOA" address="0x00009888" value="0x041B3400" />
+        <register type="NOA" address="0x00009888" value="0x101B0000" />
+        <register type="NOA" address="0x00009888" value="0x045C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A3D4000" />
+        <register type="NOA" address="0x00009888" value="0x003F0080" />
+        <register type="NOA" address="0x00009888" value="0x023F0793" />
+        <register type="NOA" address="0x00009888" value="0x043F0014" />
+        <register type="NOA" address="0x00009888" value="0x04588000" />
+        <register type="NOA" address="0x00009888" value="0x005A8000" />
+        <register type="NOA" address="0x00009888" value="0x025AC000" />
+        <register type="NOA" address="0x00009888" value="0x045A4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B4000" />
+        <register type="NOA" address="0x00009888" value="0x001D8000" />
+        <register type="NOA" address="0x00009888" value="0x021DC000" />
+        <register type="NOA" address="0x00009888" value="0x041D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F002A" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x00394000" />
+        <register type="NOA" address="0x00009888" value="0x02395000" />
+        <register type="NOA" address="0x00009888" value="0x04399000" />
+        <register type="NOA" address="0x00009888" value="0x069B0034" />
+        <register type="NOA" address="0x00009888" value="0x109B0000" />
+        <register type="NOA" address="0x00009888" value="0x06DC4000" />
+        <register type="NOA" address="0x00009888" value="0x0CBD4000" />
+        <register type="NOA" address="0x00009888" value="0x0CBF0981" />
+        <register type="NOA" address="0x00009888" value="0x0EBF0A0F" />
+        <register type="NOA" address="0x00009888" value="0x06D84000" />
+        <register type="NOA" address="0x00009888" value="0x0CDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0CDB4000" />
+        <register type="NOA" address="0x00009888" value="0x0C9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E9DC000" />
+        <register type="NOA" address="0x00009888" value="0x109F02A8" />
+        <register type="NOA" address="0x00009888" value="0x0E9F0080" />
+        <register type="NOA" address="0x00009888" value="0x0CB84000" />
+        <register type="NOA" address="0x00009888" value="0x0CB95000" />
+        <register type="NOA" address="0x00009888" value="0x0EB95000" />
+        <register type="NOA" address="0x00009888" value="0x06B92000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258B8009" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x198C4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2185800A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x1B830154" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x45800C00" />
+        <register type="NOA" address="0x00009888" value="0x47800C63" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F8014A5" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800045" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_4"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_4"
+       hw_config_guid="d7793b26-b5e3-4f0f-ad78-7ebc9d0b4c7d"
+       chipset="BDW"
+       symbol_name="L3_4"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank2 Active"
+             description="The percentage of time in which slice1 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank2_active"
+             units="percent"
+             symbol_name="L31Bank2Active"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice1 L3 Bank2 Stalled"
+             description="The percentage of time in which slice1 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank2_stalled"
+             units="percent"
+             symbol_name="L31Bank2Stalled"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x121A0340" />
+        <register type="NOA" address="0x00009888" value="0x103F0017" />
+        <register type="NOA" address="0x00009888" value="0x123F0020" />
+        <register type="NOA" address="0x00009888" value="0x129A0340" />
+        <register type="NOA" address="0x00009888" value="0x10BF0017" />
+        <register type="NOA" address="0x00009888" value="0x12BF0020" />
+        <register type="NOA" address="0x00009888" value="0x041A3400" />
+        <register type="NOA" address="0x00009888" value="0x101A0000" />
+        <register type="NOA" address="0x00009888" value="0x043B8000" />
+        <register type="NOA" address="0x00009888" value="0x0A3E0010" />
+        <register type="NOA" address="0x00009888" value="0x003F0200" />
+        <register type="NOA" address="0x00009888" value="0x023F0113" />
+        <register type="NOA" address="0x00009888" value="0x043F0014" />
+        <register type="NOA" address="0x00009888" value="0x02592000" />
+        <register type="NOA" address="0x00009888" value="0x005A8000" />
+        <register type="NOA" address="0x00009888" value="0x025AC000" />
+        <register type="NOA" address="0x00009888" value="0x045A4000" />
+        <register type="NOA" address="0x00009888" value="0x0A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x001D8000" />
+        <register type="NOA" address="0x00009888" value="0x021DC000" />
+        <register type="NOA" address="0x00009888" value="0x041D4000" />
+        <register type="NOA" address="0x00009888" value="0x0A1E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F001A" />
+        <register type="NOA" address="0x00009888" value="0x00394000" />
+        <register type="NOA" address="0x00009888" value="0x02395000" />
+        <register type="NOA" address="0x00009888" value="0x04391000" />
+        <register type="NOA" address="0x00009888" value="0x069A0034" />
+        <register type="NOA" address="0x00009888" value="0x109A0000" />
+        <register type="NOA" address="0x00009888" value="0x06BB4000" />
+        <register type="NOA" address="0x00009888" value="0x0ABE0040" />
+        <register type="NOA" address="0x00009888" value="0x0CBF0984" />
+        <register type="NOA" address="0x00009888" value="0x0EBF0A02" />
+        <register type="NOA" address="0x00009888" value="0x02D94000" />
+        <register type="NOA" address="0x00009888" value="0x0CDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0C9C0400" />
+        <register type="NOA" address="0x00009888" value="0x0C9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0C9E0400" />
+        <register type="NOA" address="0x00009888" value="0x109F02A8" />
+        <register type="NOA" address="0x00009888" value="0x0E9F0040" />
+        <register type="NOA" address="0x00009888" value="0x0CB95000" />
+        <register type="NOA" address="0x00009888" value="0x0EB95000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258B8009" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x198C4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2185800A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x1B830154" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x45800800" />
+        <register type="NOA" address="0x00009888" value="0x47800842" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F801084" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800044" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="da0f7875-1143-4d73-a39c-9128a951c46a"
+       chipset="BDW"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Rasterizer Input Available"
+             description="The percentage of time in which slice1 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer1_input_available"
+             units="percent"
+             symbol_name="Rasterizer1InputAvailable"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Pixel Values Ready"
+             description="The percentage of time in which slice1 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values1_ready"
+             units="percent"
+             symbol_name="PixelValues1Ready"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice1 PS Output Available"
+             description="The percentage of time in which slice1 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output1_available"
+             units="percent"
+             symbol_name="PSOutput1Available"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice1 Rasterizer Output Ready"
+             description="The percentage of time in which slice1 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer1_output_ready"
+             units="percent"
+             symbol_name="Rasterizer1OutputReady"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice1 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice1 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data1_ready"
+             units="percent"
+             symbol_name="PixelData1Ready"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x143B000E" />
+        <register type="NOA" address="0x00009888" value="0x043C55C0" />
+        <register type="NOA" address="0x00009888" value="0x0A1E0280" />
+        <register type="NOA" address="0x00009888" value="0x0C1E0408" />
+        <register type="NOA" address="0x00009888" value="0x10390000" />
+        <register type="NOA" address="0x00009888" value="0x12397A1F" />
+        <register type="NOA" address="0x00009888" value="0x14BB000E" />
+        <register type="NOA" address="0x00009888" value="0x04BC5000" />
+        <register type="NOA" address="0x00009888" value="0x0A9E0296" />
+        <register type="NOA" address="0x00009888" value="0x0C9E0008" />
+        <register type="NOA" address="0x00009888" value="0x10B90000" />
+        <register type="NOA" address="0x00009888" value="0x12B97A1F" />
+        <register type="NOA" address="0x00009888" value="0x063B0042" />
+        <register type="NOA" address="0x00009888" value="0x103B0000" />
+        <register type="NOA" address="0x00009888" value="0x083C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A3E0040" />
+        <register type="NOA" address="0x00009888" value="0x043F8000" />
+        <register type="NOA" address="0x00009888" value="0x02594000" />
+        <register type="NOA" address="0x00009888" value="0x045A8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1C0400" />
+        <register type="NOA" address="0x00009888" value="0x041D8000" />
+        <register type="NOA" address="0x00009888" value="0x081E02C0" />
+        <register type="NOA" address="0x00009888" value="0x0E1E0000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E1F0260" />
+        <register type="NOA" address="0x00009888" value="0x101F0014" />
+        <register type="NOA" address="0x00009888" value="0x003905E0" />
+        <register type="NOA" address="0x00009888" value="0x06390BC0" />
+        <register type="NOA" address="0x00009888" value="0x02390018" />
+        <register type="NOA" address="0x00009888" value="0x04394000" />
+        <register type="NOA" address="0x00009888" value="0x04BB0042" />
+        <register type="NOA" address="0x00009888" value="0x10BB0000" />
+        <register type="NOA" address="0x00009888" value="0x02BC05C0" />
+        <register type="NOA" address="0x00009888" value="0x08BC0000" />
+        <register type="NOA" address="0x00009888" value="0x0ABE0004" />
+        <register type="NOA" address="0x00009888" value="0x02BF8000" />
+        <register type="NOA" address="0x00009888" value="0x02D91000" />
+        <register type="NOA" address="0x00009888" value="0x02DA8000" />
+        <register type="NOA" address="0x00009888" value="0x089C8000" />
+        <register type="NOA" address="0x00009888" value="0x029D8000" />
+        <register type="NOA" address="0x00009888" value="0x089E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E9E0000" />
+        <register type="NOA" address="0x00009888" value="0x0E9FA806" />
+        <register type="NOA" address="0x00009888" value="0x109F0142" />
+        <register type="NOA" address="0x00009888" value="0x08B90617" />
+        <register type="NOA" address="0x00009888" value="0x0AB90BE0" />
+        <register type="NOA" address="0x00009888" value="0x02B94000" />
+        <register type="NOA" address="0x00009888" value="0x0D88F000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000C" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A2800" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x238B52A0" />
+        <register type="NOA" address="0x00009888" value="0x258B6A95" />
+        <register type="NOA" address="0x00009888" value="0x278B0029" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C1500" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0014" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x038D8000" />
+        <register type="NOA" address="0x00009888" value="0x058D2000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x4D800444" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F804000" />
+        <register type="NOA" address="0x00009888" value="0x43801080" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800084" />
+        <register type="NOA" address="0x00009888" value="0x53800044" />
+        <register type="NOA" address="0x00009888" value="0x47801080" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800840" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00006000" />
+        <register type="OA" address="0x00002774" value="0x0000F3FF" />
+        <register type="OA" address="0x00002778" value="0x00001800" />
+        <register type="OA" address="0x0000277C" value="0x0000FCFF" />
+        <register type="OA" address="0x00002780" value="0x00000600" />
+        <register type="OA" address="0x00002784" value="0x0000FF3F" />
+        <register type="OA" address="0x00002788" value="0x00000180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000060" />
+        <register type="OA" address="0x00002794" value="0x0000FFF3" />
+        <register type="OA" address="0x00002798" value="0x00000018" />
+        <register type="OA" address="0x0000279C" value="0x0000FFFC" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler_1"
+       hw_config_guid="52c186e4-39e3-4534-87cd-41bd47763df9"
+       chipset="BDW"
+       symbol_name="Sampler_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Slice1 Subslice0 Input Available"
+             description="The percentage of time in which slice1 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler10_input_available"
+             units="percent"
+             symbol_name="Sampler10InputAvailable"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Slice1 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice1 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler12_output_ready"
+             units="percent"
+             symbol_name="Sampler12OutputReady"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Subslice1 Input Available"
+             description="The percentage of time in which slice1 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler11_input_available"
+             units="percent"
+             symbol_name="Sampler11InputAvailable"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice1 Subslice2 Input Available"
+             description="The percentage of time in which slice1 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler12_input_available"
+             units="percent"
+             symbol_name="Sampler12InputAvailable"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice1 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice1 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler10_output_ready"
+             units="percent"
+             symbol_name="Sampler10OutputReady"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Slice1 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice1 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler11_output_ready"
+             units="percent"
+             symbol_name="Sampler11OutputReady"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x18921400" />
+        <register type="NOA" address="0x00009888" value="0x149500AB" />
+        <register type="NOA" address="0x00009888" value="0x18B21400" />
+        <register type="NOA" address="0x00009888" value="0x14B500AB" />
+        <register type="NOA" address="0x00009888" value="0x18D21400" />
+        <register type="NOA" address="0x00009888" value="0x14D500AB" />
+        <register type="NOA" address="0x00009888" value="0x0CDC8000" />
+        <register type="NOA" address="0x00009888" value="0x0EDC4000" />
+        <register type="NOA" address="0x00009888" value="0x02DCC000" />
+        <register type="NOA" address="0x00009888" value="0x04DCC000" />
+        <register type="NOA" address="0x00009888" value="0x1ABD00A0" />
+        <register type="NOA" address="0x00009888" value="0x0ABD8000" />
+        <register type="NOA" address="0x00009888" value="0x0CD88000" />
+        <register type="NOA" address="0x00009888" value="0x0ED84000" />
+        <register type="NOA" address="0x00009888" value="0x04D88000" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0050" />
+        <register type="NOA" address="0x00009888" value="0x04DB8000" />
+        <register type="NOA" address="0x00009888" value="0x06DB8000" />
+        <register type="NOA" address="0x00009888" value="0x08DB8000" />
+        <register type="NOA" address="0x00009888" value="0x0ADB4000" />
+        <register type="NOA" address="0x00009888" value="0x109F02A0" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F00AA" />
+        <register type="NOA" address="0x00009888" value="0x18B82500" />
+        <register type="NOA" address="0x00009888" value="0x02B88000" />
+        <register type="NOA" address="0x00009888" value="0x04B84000" />
+        <register type="NOA" address="0x00009888" value="0x06B84000" />
+        <register type="NOA" address="0x00009888" value="0x08B84000" />
+        <register type="NOA" address="0x00009888" value="0x0AB84000" />
+        <register type="NOA" address="0x00009888" value="0x0CB88000" />
+        <register type="NOA" address="0x00009888" value="0x0CB98000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x00B98000" />
+        <register type="NOA" address="0x00009888" value="0x02B9A000" />
+        <register type="NOA" address="0x00009888" value="0x04B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06B92000" />
+        <register type="NOA" address="0x00009888" value="0x1ABA0200" />
+        <register type="NOA" address="0x00009888" value="0x02BA8000" />
+        <register type="NOA" address="0x00009888" value="0x0CBA8000" />
+        <register type="NOA" address="0x00009888" value="0x04908000" />
+        <register type="NOA" address="0x00009888" value="0x04918000" />
+        <register type="NOA" address="0x00009888" value="0x04927300" />
+        <register type="NOA" address="0x00009888" value="0x10920000" />
+        <register type="NOA" address="0x00009888" value="0x1893000A" />
+        <register type="NOA" address="0x00009888" value="0x0A934000" />
+        <register type="NOA" address="0x00009888" value="0x0A946000" />
+        <register type="NOA" address="0x00009888" value="0x0C959000" />
+        <register type="NOA" address="0x00009888" value="0x0E950098" />
+        <register type="NOA" address="0x00009888" value="0x10950000" />
+        <register type="NOA" address="0x00009888" value="0x04B04000" />
+        <register type="NOA" address="0x00009888" value="0x04B14000" />
+        <register type="NOA" address="0x00009888" value="0x04B20073" />
+        <register type="NOA" address="0x00009888" value="0x10B20000" />
+        <register type="NOA" address="0x00009888" value="0x04B38000" />
+        <register type="NOA" address="0x00009888" value="0x06B38000" />
+        <register type="NOA" address="0x00009888" value="0x08B34000" />
+        <register type="NOA" address="0x00009888" value="0x04B4C000" />
+        <register type="NOA" address="0x00009888" value="0x02B59890" />
+        <register type="NOA" address="0x00009888" value="0x10B50000" />
+        <register type="NOA" address="0x00009888" value="0x06D04000" />
+        <register type="NOA" address="0x00009888" value="0x06D14000" />
+        <register type="NOA" address="0x00009888" value="0x06D20073" />
+        <register type="NOA" address="0x00009888" value="0x10D20000" />
+        <register type="NOA" address="0x00009888" value="0x18D30020" />
+        <register type="NOA" address="0x00009888" value="0x02D38000" />
+        <register type="NOA" address="0x00009888" value="0x0CD34000" />
+        <register type="NOA" address="0x00009888" value="0x0AD48000" />
+        <register type="NOA" address="0x00009888" value="0x04D42000" />
+        <register type="NOA" address="0x00009888" value="0x0ED59000" />
+        <register type="NOA" address="0x00009888" value="0x00D59800" />
+        <register type="NOA" address="0x00009888" value="0x10D50000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000E" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B5500" />
+        <register type="NOA" address="0x00009888" value="0x258B000A" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8D8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x018D8000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x2185000A" />
+        <register type="NOA" address="0x00009888" value="0x1B830150" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D848000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D808000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47801021" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800C64" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800C02" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler_2"
+       hw_config_guid="edcb8c31-764d-451a-9ecd-c9c89fb54f8d"
+       chipset="BDW"
+       symbol_name="Sampler_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x18121400" />
+        <register type="NOA" address="0x00009888" value="0x141500AB" />
+        <register type="NOA" address="0x00009888" value="0x18321400" />
+        <register type="NOA" address="0x00009888" value="0x143500AB" />
+        <register type="NOA" address="0x00009888" value="0x18521400" />
+        <register type="NOA" address="0x00009888" value="0x145500AB" />
+        <register type="NOA" address="0x00009888" value="0x0C5C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5C4000" />
+        <register type="NOA" address="0x00009888" value="0x025CC000" />
+        <register type="NOA" address="0x00009888" value="0x045CC000" />
+        <register type="NOA" address="0x00009888" value="0x1A3D00A0" />
+        <register type="NOA" address="0x00009888" value="0x0A3D8000" />
+        <register type="NOA" address="0x00009888" value="0x0C588000" />
+        <register type="NOA" address="0x00009888" value="0x0E584000" />
+        <register type="NOA" address="0x00009888" value="0x04588000" />
+        <register type="NOA" address="0x00009888" value="0x1A5B0050" />
+        <register type="NOA" address="0x00009888" value="0x045B8000" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B8000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B4000" />
+        <register type="NOA" address="0x00009888" value="0x101F02A0" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00AA" />
+        <register type="NOA" address="0x00009888" value="0x18382500" />
+        <register type="NOA" address="0x00009888" value="0x02388000" />
+        <register type="NOA" address="0x00009888" value="0x04384000" />
+        <register type="NOA" address="0x00009888" value="0x06384000" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0C388000" />
+        <register type="NOA" address="0x00009888" value="0x0C398000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x00398000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x1A3A0200" />
+        <register type="NOA" address="0x00009888" value="0x023A8000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A8000" />
+        <register type="NOA" address="0x00009888" value="0x04108000" />
+        <register type="NOA" address="0x00009888" value="0x04118000" />
+        <register type="NOA" address="0x00009888" value="0x04127300" />
+        <register type="NOA" address="0x00009888" value="0x10120000" />
+        <register type="NOA" address="0x00009888" value="0x1813000A" />
+        <register type="NOA" address="0x00009888" value="0x0A134000" />
+        <register type="NOA" address="0x00009888" value="0x0A146000" />
+        <register type="NOA" address="0x00009888" value="0x0C159000" />
+        <register type="NOA" address="0x00009888" value="0x0E150098" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04304000" />
+        <register type="NOA" address="0x00009888" value="0x04314000" />
+        <register type="NOA" address="0x00009888" value="0x04320073" />
+        <register type="NOA" address="0x00009888" value="0x10320000" />
+        <register type="NOA" address="0x00009888" value="0x04338000" />
+        <register type="NOA" address="0x00009888" value="0x06338000" />
+        <register type="NOA" address="0x00009888" value="0x08334000" />
+        <register type="NOA" address="0x00009888" value="0x0434C000" />
+        <register type="NOA" address="0x00009888" value="0x02359890" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x06504000" />
+        <register type="NOA" address="0x00009888" value="0x06514000" />
+        <register type="NOA" address="0x00009888" value="0x06520073" />
+        <register type="NOA" address="0x00009888" value="0x10520000" />
+        <register type="NOA" address="0x00009888" value="0x18530020" />
+        <register type="NOA" address="0x00009888" value="0x02538000" />
+        <register type="NOA" address="0x00009888" value="0x0C534000" />
+        <register type="NOA" address="0x00009888" value="0x0A548000" />
+        <register type="NOA" address="0x00009888" value="0x04542000" />
+        <register type="NOA" address="0x00009888" value="0x0E559000" />
+        <register type="NOA" address="0x00009888" value="0x00559800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AA000" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x258B0005" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x2185000A" />
+        <register type="NOA" address="0x00009888" value="0x1B830150" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D848000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D808000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47801021" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800C64" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800C02" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="729fc3f4-ccff-4902-be6b-f1a22cc92c02"
+       chipset="BDW"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice1 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice1 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread11_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread11ReadyForDispatch"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice1 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice1 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread12_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread12ReadyForDispatch"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice1 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice1 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread10_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread10ReadyForDispatch"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice1 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice1 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread12_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread12ReadyForDispatch"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice1 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice1 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread10_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread10ReadyForDispatch"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice1 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice1 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread11_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread11ReadyForDispatch"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x16154D60" />
+        <register type="NOA" address="0x00009888" value="0x16352E60" />
+        <register type="NOA" address="0x00009888" value="0x16554D60" />
+        <register type="NOA" address="0x00009888" value="0x16950000" />
+        <register type="NOA" address="0x00009888" value="0x16B50000" />
+        <register type="NOA" address="0x00009888" value="0x16D50000" />
+        <register type="NOA" address="0x00009888" value="0x005C8000" />
+        <register type="NOA" address="0x00009888" value="0x045CC000" />
+        <register type="NOA" address="0x00009888" value="0x065C4000" />
+        <register type="NOA" address="0x00009888" value="0x083D8000" />
+        <register type="NOA" address="0x00009888" value="0x0A3D8000" />
+        <register type="NOA" address="0x00009888" value="0x0458C000" />
+        <register type="NOA" address="0x00009888" value="0x025B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B4000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00AA" />
+        <register type="NOA" address="0x00009888" value="0x02384000" />
+        <register type="NOA" address="0x00009888" value="0x04388000" />
+        <register type="NOA" address="0x00009888" value="0x06388000" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0C384000" />
+        <register type="NOA" address="0x00009888" value="0x00398000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x043A8000" />
+        <register type="NOA" address="0x00009888" value="0x063A8000" />
+        <register type="NOA" address="0x00009888" value="0x08138000" />
+        <register type="NOA" address="0x00009888" value="0x0A138000" />
+        <register type="NOA" address="0x00009888" value="0x06143000" />
+        <register type="NOA" address="0x00009888" value="0x0415CFC7" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x02338000" />
+        <register type="NOA" address="0x00009888" value="0x0C338000" />
+        <register type="NOA" address="0x00009888" value="0x04342000" />
+        <register type="NOA" address="0x00009888" value="0x06344000" />
+        <register type="NOA" address="0x00009888" value="0x0035C700" />
+        <register type="NOA" address="0x00009888" value="0x063500CF" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04538000" />
+        <register type="NOA" address="0x00009888" value="0x06538000" />
+        <register type="NOA" address="0x00009888" value="0x0454C000" />
+        <register type="NOA" address="0x00009888" value="0x0255CFC7" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06DC8000" />
+        <register type="NOA" address="0x00009888" value="0x08DC4000" />
+        <register type="NOA" address="0x00009888" value="0x0CDCC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDCC000" />
+        <register type="NOA" address="0x00009888" value="0x1ABD00A8" />
+        <register type="NOA" address="0x00009888" value="0x0CD8C000" />
+        <register type="NOA" address="0x00009888" value="0x0ED84000" />
+        <register type="NOA" address="0x00009888" value="0x0EDB8000" />
+        <register type="NOA" address="0x00009888" value="0x18DB0800" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0254" />
+        <register type="NOA" address="0x00009888" value="0x0E9FAA00" />
+        <register type="NOA" address="0x00009888" value="0x109F02AA" />
+        <register type="NOA" address="0x00009888" value="0x0EB84000" />
+        <register type="NOA" address="0x00009888" value="0x16B84000" />
+        <register type="NOA" address="0x00009888" value="0x18B8156A" />
+        <register type="NOA" address="0x00009888" value="0x06B98000" />
+        <register type="NOA" address="0x00009888" value="0x08B9A000" />
+        <register type="NOA" address="0x00009888" value="0x0AB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0CB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x18BAA000" />
+        <register type="NOA" address="0x00009888" value="0x1ABA0002" />
+        <register type="NOA" address="0x00009888" value="0x16934000" />
+        <register type="NOA" address="0x00009888" value="0x1893000A" />
+        <register type="NOA" address="0x00009888" value="0x0A947000" />
+        <register type="NOA" address="0x00009888" value="0x0C95C5C1" />
+        <register type="NOA" address="0x00009888" value="0x0E9500C3" />
+        <register type="NOA" address="0x00009888" value="0x10950000" />
+        <register type="NOA" address="0x00009888" value="0x0EB38000" />
+        <register type="NOA" address="0x00009888" value="0x16B30040" />
+        <register type="NOA" address="0x00009888" value="0x18B30020" />
+        <register type="NOA" address="0x00009888" value="0x06B48000" />
+        <register type="NOA" address="0x00009888" value="0x08B41000" />
+        <register type="NOA" address="0x00009888" value="0x0AB48000" />
+        <register type="NOA" address="0x00009888" value="0x06B5C500" />
+        <register type="NOA" address="0x00009888" value="0x08B500C3" />
+        <register type="NOA" address="0x00009888" value="0x0EB5C100" />
+        <register type="NOA" address="0x00009888" value="0x10B50000" />
+        <register type="NOA" address="0x00009888" value="0x16D31500" />
+        <register type="NOA" address="0x00009888" value="0x08D4E000" />
+        <register type="NOA" address="0x00009888" value="0x08D5C100" />
+        <register type="NOA" address="0x00009888" value="0x0AD5C3C5" />
+        <register type="NOA" address="0x00009888" value="0x10D50000" />
+        <register type="NOA" address="0x00009888" value="0x0D88F800" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258BAAA5" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x0F8C4000" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C5500" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x078D8000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800C42" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800063" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800800" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F8014A4" />
+        <register type="NOA" address="0x00009888" value="0x41801042" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x0000FE7F" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFBF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFF7" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FFF9" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="29598975-4785-43ab-a981-1dfa58d0e835"
+       chipset="BDW"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice1 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header11_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader11ReadyPort1"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice1 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header11_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader11ReadyPort0"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice1 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header12_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader12ReadyPort0"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice1 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header10_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader10ReadyPort1"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice1 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header12_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader12ReadyPort1"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice1 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header10_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader10ReadyPort0"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x16150000" />
+        <register type="NOA" address="0x00009888" value="0x16350000" />
+        <register type="NOA" address="0x00009888" value="0x16550000" />
+        <register type="NOA" address="0x00009888" value="0x16952E60" />
+        <register type="NOA" address="0x00009888" value="0x16B54D60" />
+        <register type="NOA" address="0x00009888" value="0x16D52E60" />
+        <register type="NOA" address="0x00009888" value="0x065C8000" />
+        <register type="NOA" address="0x00009888" value="0x085CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5C4000" />
+        <register type="NOA" address="0x00009888" value="0x0E3D8000" />
+        <register type="NOA" address="0x00009888" value="0x183DA000" />
+        <register type="NOA" address="0x00009888" value="0x06588000" />
+        <register type="NOA" address="0x00009888" value="0x08588000" />
+        <register type="NOA" address="0x00009888" value="0x0A584000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x185B5800" />
+        <register type="NOA" address="0x00009888" value="0x1A5B000A" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAA00" />
+        <register type="NOA" address="0x00009888" value="0x101F02AA" />
+        <register type="NOA" address="0x00009888" value="0x0E384000" />
+        <register type="NOA" address="0x00009888" value="0x16384000" />
+        <register type="NOA" address="0x00009888" value="0x18382A55" />
+        <register type="NOA" address="0x00009888" value="0x06398000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0C39A000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x1A3A02A0" />
+        <register type="NOA" address="0x00009888" value="0x0E138000" />
+        <register type="NOA" address="0x00009888" value="0x16130500" />
+        <register type="NOA" address="0x00009888" value="0x06148000" />
+        <register type="NOA" address="0x00009888" value="0x08146000" />
+        <register type="NOA" address="0x00009888" value="0x0615C100" />
+        <register type="NOA" address="0x00009888" value="0x0815C500" />
+        <register type="NOA" address="0x00009888" value="0x0A1500C3" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x16335040" />
+        <register type="NOA" address="0x00009888" value="0x08349000" />
+        <register type="NOA" address="0x00009888" value="0x0A341000" />
+        <register type="NOA" address="0x00009888" value="0x083500C1" />
+        <register type="NOA" address="0x00009888" value="0x0A35C500" />
+        <register type="NOA" address="0x00009888" value="0x0C3500C3" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x1853002A" />
+        <register type="NOA" address="0x00009888" value="0x0A54E000" />
+        <register type="NOA" address="0x00009888" value="0x0C55C500" />
+        <register type="NOA" address="0x00009888" value="0x0E55C1C3" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x00DC8000" />
+        <register type="NOA" address="0x00009888" value="0x02DCC000" />
+        <register type="NOA" address="0x00009888" value="0x04DC4000" />
+        <register type="NOA" address="0x00009888" value="0x04BD8000" />
+        <register type="NOA" address="0x00009888" value="0x06BD8000" />
+        <register type="NOA" address="0x00009888" value="0x02D8C000" />
+        <register type="NOA" address="0x00009888" value="0x02DB8000" />
+        <register type="NOA" address="0x00009888" value="0x04DB4000" />
+        <register type="NOA" address="0x00009888" value="0x06DB4000" />
+        <register type="NOA" address="0x00009888" value="0x08DB8000" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F00AA" />
+        <register type="NOA" address="0x00009888" value="0x02B84000" />
+        <register type="NOA" address="0x00009888" value="0x04B84000" />
+        <register type="NOA" address="0x00009888" value="0x06B84000" />
+        <register type="NOA" address="0x00009888" value="0x08B84000" />
+        <register type="NOA" address="0x00009888" value="0x0AB88000" />
+        <register type="NOA" address="0x00009888" value="0x0CB88000" />
+        <register type="NOA" address="0x00009888" value="0x00B98000" />
+        <register type="NOA" address="0x00009888" value="0x02B9A000" />
+        <register type="NOA" address="0x00009888" value="0x04B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06B92000" />
+        <register type="NOA" address="0x00009888" value="0x0ABA8000" />
+        <register type="NOA" address="0x00009888" value="0x0CBA8000" />
+        <register type="NOA" address="0x00009888" value="0x04938000" />
+        <register type="NOA" address="0x00009888" value="0x06938000" />
+        <register type="NOA" address="0x00009888" value="0x0494C000" />
+        <register type="NOA" address="0x00009888" value="0x0295CFC7" />
+        <register type="NOA" address="0x00009888" value="0x10950000" />
+        <register type="NOA" address="0x00009888" value="0x02B38000" />
+        <register type="NOA" address="0x00009888" value="0x08B38000" />
+        <register type="NOA" address="0x00009888" value="0x04B42000" />
+        <register type="NOA" address="0x00009888" value="0x06B41000" />
+        <register type="NOA" address="0x00009888" value="0x00B5C700" />
+        <register type="NOA" address="0x00009888" value="0x04B500CF" />
+        <register type="NOA" address="0x00009888" value="0x10B50000" />
+        <register type="NOA" address="0x00009888" value="0x0AD38000" />
+        <register type="NOA" address="0x00009888" value="0x0CD38000" />
+        <register type="NOA" address="0x00009888" value="0x06D46000" />
+        <register type="NOA" address="0x00009888" value="0x04D5C700" />
+        <register type="NOA" address="0x00009888" value="0x06D500CF" />
+        <register type="NOA" address="0x00009888" value="0x10D50000" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x258B555A" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x238B5500" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x018D8000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800882" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45801082" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x478014A5" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800002" />
+        <register type="NOA" address="0x00009888" value="0x41800C62" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x0000FE7F" />
+        <register type="OA" address="0x00002780" value="0x00000000" />
+        <register type="OA" address="0x00002784" value="0x0000FF9F" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000FFE7" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFFB" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FFFD" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen8"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="8fb61ba2-2fbb-454c-a136-2dec5a8a595e"
+       chipset="BDW"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 5 READ C 6 READ FADD C 7 READ FADD C 2 READ FADD C 3 READ FADD C 4 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x161503E0" />
+        <register type="NOA" address="0x00009888" value="0x163503E0" />
+        <register type="NOA" address="0x00009888" value="0x165503E0" />
+        <register type="NOA" address="0x00009888" value="0x169503E0" />
+        <register type="NOA" address="0x00009888" value="0x16B503E0" />
+        <register type="NOA" address="0x00009888" value="0x16D503E0" />
+        <register type="NOA" address="0x00009888" value="0x045CC000" />
+        <register type="NOA" address="0x00009888" value="0x083D8000" />
+        <register type="NOA" address="0x00009888" value="0x04584000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00A8" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0C388000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A8000" />
+        <register type="NOA" address="0x00009888" value="0x08138000" />
+        <register type="NOA" address="0x00009888" value="0x06141000" />
+        <register type="NOA" address="0x00009888" value="0x041500C3" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x0A338000" />
+        <register type="NOA" address="0x00009888" value="0x06342000" />
+        <register type="NOA" address="0x00009888" value="0x0435C300" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x0C538000" />
+        <register type="NOA" address="0x00009888" value="0x06544000" />
+        <register type="NOA" address="0x00009888" value="0x065500C3" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x00DC8000" />
+        <register type="NOA" address="0x00009888" value="0x02DC4000" />
+        <register type="NOA" address="0x00009888" value="0x02BD8000" />
+        <register type="NOA" address="0x00009888" value="0x00D88000" />
+        <register type="NOA" address="0x00009888" value="0x02DB4000" />
+        <register type="NOA" address="0x00009888" value="0x04DB8000" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F0002" />
+        <register type="NOA" address="0x00009888" value="0x02B84000" />
+        <register type="NOA" address="0x00009888" value="0x04B84000" />
+        <register type="NOA" address="0x00009888" value="0x06B88000" />
+        <register type="NOA" address="0x00009888" value="0x00B98000" />
+        <register type="NOA" address="0x00009888" value="0x02B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06BA8000" />
+        <register type="NOA" address="0x00009888" value="0x02938000" />
+        <register type="NOA" address="0x00009888" value="0x04942000" />
+        <register type="NOA" address="0x00009888" value="0x0095C300" />
+        <register type="NOA" address="0x00009888" value="0x10950000" />
+        <register type="NOA" address="0x00009888" value="0x04B38000" />
+        <register type="NOA" address="0x00009888" value="0x04B44000" />
+        <register type="NOA" address="0x00009888" value="0x02B500C3" />
+        <register type="NOA" address="0x00009888" value="0x10B50000" />
+        <register type="NOA" address="0x00009888" value="0x06D38000" />
+        <register type="NOA" address="0x00009888" value="0x04D48000" />
+        <register type="NOA" address="0x00009888" value="0x02D5C300" />
+        <register type="NOA" address="0x00009888" value="0x10D50000" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x238B3500" />
+        <register type="NOA" address="0x00009888" value="0x258B0005" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x018D8000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x2185000A" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800C40" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41801482" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00001000" />
+        <register type="FLEX" address="0x0000E558" value="0x00003002" />
+        <register type="FLEX" address="0x0000E658" value="0x00005004" />
+        <register type="FLEX" address="0x0000E758" value="0x00011010" />
+        <register type="FLEX" address="0x0000E45C" value="0x00050012" />
+        <register type="FLEX" address="0x0000E55C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E65C" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="Media Vme Pipe Gen8"
+       mdapi_supported_apis="MEDIA IO BB"
+       underscore_name="vme_pipe"
+       hw_config_guid="e1743ca0-7fc8-410b-a066-de7bbb9280b7"
+       chipset="BDW"
+       symbol_name="VMEPipe"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VME Busy"
+             description="The percentage of time in which VME (IME or CRE) was actively processing data."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vme_busy"
+             units="percent"
+             symbol_name="VMEBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview System Batch Tier2"
+             mdapi_group="VME Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x14100812" />
+        <register type="NOA" address="0x00009888" value="0x14125800" />
+        <register type="NOA" address="0x00009888" value="0x161200C0" />
+        <register type="NOA" address="0x00009888" value="0x14300812" />
+        <register type="NOA" address="0x00009888" value="0x14325800" />
+        <register type="NOA" address="0x00009888" value="0x163200C0" />
+        <register type="NOA" address="0x00009888" value="0x005C4000" />
+        <register type="NOA" address="0x00009888" value="0x065C8000" />
+        <register type="NOA" address="0x00009888" value="0x085CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5CC000" />
+        <register type="NOA" address="0x00009888" value="0x003D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E3D8000" />
+        <register type="NOA" address="0x00009888" value="0x183D2800" />
+        <register type="NOA" address="0x00009888" value="0x00584000" />
+        <register type="NOA" address="0x00009888" value="0x06588000" />
+        <register type="NOA" address="0x00009888" value="0x0858C000" />
+        <register type="NOA" address="0x00009888" value="0x005B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x185B9400" />
+        <register type="NOA" address="0x00009888" value="0x1A5B002A" />
+        <register type="NOA" address="0x00009888" value="0x0C1F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAA00" />
+        <register type="NOA" address="0x00009888" value="0x101F002A" />
+        <register type="NOA" address="0x00009888" value="0x00384000" />
+        <register type="NOA" address="0x00009888" value="0x0E384000" />
+        <register type="NOA" address="0x00009888" value="0x16384000" />
+        <register type="NOA" address="0x00009888" value="0x18380155" />
+        <register type="NOA" address="0x00009888" value="0x00392000" />
+        <register type="NOA" address="0x00009888" value="0x06398000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0C39A000" />
+        <register type="NOA" address="0x00009888" value="0x00100047" />
+        <register type="NOA" address="0x00009888" value="0x06101A80" />
+        <register type="NOA" address="0x00009888" value="0x10100000" />
+        <register type="NOA" address="0x00009888" value="0x0810C000" />
+        <register type="NOA" address="0x00009888" value="0x0811C000" />
+        <register type="NOA" address="0x00009888" value="0x08126151" />
+        <register type="NOA" address="0x00009888" value="0x10120000" />
+        <register type="NOA" address="0x00009888" value="0x00134000" />
+        <register type="NOA" address="0x00009888" value="0x0E134000" />
+        <register type="NOA" address="0x00009888" value="0x161300A0" />
+        <register type="NOA" address="0x00009888" value="0x0A301AC7" />
+        <register type="NOA" address="0x00009888" value="0x10300000" />
+        <register type="NOA" address="0x00009888" value="0x0C30C000" />
+        <register type="NOA" address="0x00009888" value="0x0C31C000" />
+        <register type="NOA" address="0x00009888" value="0x0C326151" />
+        <register type="NOA" address="0x00009888" value="0x10320000" />
+        <register type="NOA" address="0x00009888" value="0x16332A00" />
+        <register type="NOA" address="0x00009888" value="0x18330001" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A2AA0" />
+        <register type="NOA" address="0x00009888" value="0x238B0020" />
+        <register type="NOA" address="0x00009888" value="0x258B5550" />
+        <register type="NOA" address="0x00009888" value="0x278B0001" />
+        <register type="NOA" address="0x00009888" value="0x1F850080" />
+        <register type="NOA" address="0x00009888" value="0x2185AAA0" />
+        <register type="NOA" address="0x00009888" value="0x23850002" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830015" />
+        <register type="NOA" address="0x00009888" value="0x01844000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x11804000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800800" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800002" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800884" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800002" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00100030" />
+        <register type="OA" address="0x00002774" value="0x0000FFF9" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFF3" />
+        <register type="OA" address="0x00002788" value="0x00100180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="0a9eb7be-feee-4275-a139-6d9cedf0fdb0"
+       chipset="BDW"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox1 Ring Busy"
+             description="The percentage of time when Vdbox1 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox1_busy"
+             units="percent"
+             symbol_name="Vdbox1Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x1AF00100" />
+        <register type="NOA" address="0x00009888" value="0x118B0000" />
+        <register type="NOA" address="0x00009888" value="0x11850008" />
+        <register type="NOA" address="0x00009888" value="0x17830100" />
+        <register type="NOA" address="0x00009888" value="0x1A700100" />
+        <register type="NOA" address="0x00009888" value="0x1D940040" />
+        <register type="NOA" address="0x00009888" value="0x02F00085" />
+        <register type="NOA" address="0x00009888" value="0x10F00000" />
+        <register type="NOA" address="0x00009888" value="0x24F00000" />
+        <register type="NOA" address="0x00009888" value="0x078B0003" />
+        <register type="NOA" address="0x00009888" value="0x238B0400" />
+        <register type="NOA" address="0x00009888" value="0x258B0000" />
+        <register type="NOA" address="0x00009888" value="0x058C8000" />
+        <register type="NOA" address="0x00009888" value="0x038D2000" />
+        <register type="NOA" address="0x00009888" value="0x03850500" />
+        <register type="NOA" address="0x00009888" value="0x1F858800" />
+        <register type="NOA" address="0x00009888" value="0x2185000A" />
+        <register type="NOA" address="0x00009888" value="0x05834055" />
+        <register type="NOA" address="0x00009888" value="0x11830000" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x0B838000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x03844000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x04708500" />
+        <register type="NOA" address="0x00009888" value="0x10700000" />
+        <register type="NOA" address="0x00009888" value="0x24700000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x4D801000" />
+        <register type="NOA" address="0x00009888" value="0x3F800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800004" />
+        <register type="NOA" address="0x00009888" value="0x418014A0" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0007C000" />
+        <register type="OA" address="0x00002774" value="0x000007FF" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen8"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="d6de6f55-e526-4f79-a6a6-d7315c09044e"
+       chipset="BDW"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x198B0000" />
+        <register type="NOA" address="0x00009888" value="0x078B0066" />
+        <register type="NOA" address="0x00009888" value="0x118B0000" />
+        <register type="NOA" address="0x00009888" value="0x258B0000" />
+        <register type="NOA" address="0x00009888" value="0x21850008" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="OGL OGL4 IO BB"
+       underscore_name="stc__pma_stall"
+       hw_config_guid="e713f347-953e-4d8c-b02f-6be31df2db2b"
+       chipset="BDW"
+       symbol_name="STC_PmaStall"
+       >
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x0C1F0001" />
+        <register type="NOA" address="0x00009888" value="0x001F0015" />
+        <register type="NOA" address="0x00009888" value="0x041F4AC0" />
+        <register type="NOA" address="0x00009888" value="0x061F03D8" />
+        <register type="NOA" address="0x00009888" value="0x0E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A00A0" />
+        <register type="NOA" address="0x00009888" value="0x238B0020" />
+        <register type="NOA" address="0x00009888" value="0x258B0550" />
+        <register type="NOA" address="0x00009888" value="0x1F850080" />
+        <register type="NOA" address="0x00009888" value="0x21850AA0" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x01844000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B844000" />
+        <register type="NOA" address="0x00009888" value="0x11804000" />
+        <register type="NOA" address="0x00009888" value="0x17808000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B804000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x008000E1" />
+        <register type="OA" address="0x00002774" value="0x001FFFE0" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-bxt.xml b/lib/i915/perf-configs/oa-bxt.xml
new file mode 100644
index 00000000..c66e7d6e
--- /dev/null
+++ b/lib/i915/perf-configs/oa-bxt.xml
@@ -0,0 +1,9595 @@
+<?xml version="1.0"?>
+<metrics version="1562317147" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="22b9519a-e9ba-4c41-8b54-f4f8ca14fa0a"
+       chipset="BXT"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x03 UGTE"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C00F0" />
+        <register type="NOA" address="0x00009888" value="0x12120280" />
+        <register type="NOA" address="0x00009888" value="0x12320280" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900C00" />
+        <register type="NOA" address="0x00009888" value="0x419000A0" />
+        <register type="NOA" address="0x00009888" value="0x002D1000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D5000" />
+        <register type="NOA" address="0x00009888" value="0x0A2D1000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E0800" />
+        <register type="NOA" address="0x00009888" value="0x0E2E5900" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4C4000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C4F0010" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A0FCC00" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0002" />
+        <register type="NOA" address="0x00009888" value="0x1C2C0040" />
+        <register type="NOA" address="0x00009888" value="0x00101000" />
+        <register type="NOA" address="0x00009888" value="0x04101000" />
+        <register type="NOA" address="0x00009888" value="0x00114000" />
+        <register type="NOA" address="0x00009888" value="0x08114000" />
+        <register type="NOA" address="0x00009888" value="0x00120020" />
+        <register type="NOA" address="0x00009888" value="0x08120021" />
+        <register type="NOA" address="0x00009888" value="0x00141000" />
+        <register type="NOA" address="0x00009888" value="0x08141000" />
+        <register type="NOA" address="0x00009888" value="0x02308000" />
+        <register type="NOA" address="0x00009888" value="0x04302000" />
+        <register type="NOA" address="0x00009888" value="0x06318000" />
+        <register type="NOA" address="0x00009888" value="0x08318000" />
+        <register type="NOA" address="0x00009888" value="0x06320800" />
+        <register type="NOA" address="0x00009888" value="0x08320840" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x06344000" />
+        <register type="NOA" address="0x00009888" value="0x08344000" />
+        <register type="NOA" address="0x00009888" value="0x0D931831" />
+        <register type="NOA" address="0x00009888" value="0x0F939F3F" />
+        <register type="NOA" address="0x00009888" value="0x01939E80" />
+        <register type="NOA" address="0x00009888" value="0x039303BC" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1993002A" />
+        <register type="NOA" address="0x00009888" value="0x07930000" />
+        <register type="NOA" address="0x00009888" value="0x09930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900177" />
+        <register type="NOA" address="0x00009888" value="0x1F900187" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x53901110" />
+        <register type="NOA" address="0x00009888" value="0x43900423" />
+        <register type="NOA" address="0x00009888" value="0x55900111" />
+        <register type="NOA" address="0x00009888" value="0x47900C02" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900020" />
+        <register type="NOA" address="0x00009888" value="0x59901111" />
+        <register type="NOA" address="0x00009888" value="0x4B900421" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x45900821" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="012d72cf-82a9-4d25-8ddf-74076fd30797"
+       chipset="BXT"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL  $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x39900340" />
+        <register type="NOA" address="0x00009888" value="0x3F900C00" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x002D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D4000" />
+        <register type="NOA" address="0x00009888" value="0x0A2D1000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E1400" />
+        <register type="NOA" address="0x00009888" value="0x0E2E5100" />
+        <register type="NOA" address="0x00009888" value="0x102E0114" />
+        <register type="NOA" address="0x00009888" value="0x044CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4C4000" />
+        <register type="NOA" address="0x00009888" value="0x104C8000" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x004EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F6B42" />
+        <register type="NOA" address="0x00009888" value="0x064F6200" />
+        <register type="NOA" address="0x00009888" value="0x084F4100" />
+        <register type="NOA" address="0x00009888" value="0x0A4F0061" />
+        <register type="NOA" address="0x00009888" value="0x0C4F6C4C" />
+        <register type="NOA" address="0x00009888" value="0x0E4F4B00" />
+        <register type="NOA" address="0x00009888" value="0x1A4F0000" />
+        <register type="NOA" address="0x00009888" value="0x1C4F0000" />
+        <register type="NOA" address="0x00009888" value="0x180F5000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F8800" />
+        <register type="NOA" address="0x00009888" value="0x1C0F08A2" />
+        <register type="NOA" address="0x00009888" value="0x182C4000" />
+        <register type="NOA" address="0x00009888" value="0x1C2C1451" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x1A2C0010" />
+        <register type="NOA" address="0x00009888" value="0x01938000" />
+        <register type="NOA" address="0x00009888" value="0x0F938000" />
+        <register type="NOA" address="0x00009888" value="0x19938A28" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x19900177" />
+        <register type="NOA" address="0x00009888" value="0x1B900178" />
+        <register type="NOA" address="0x00009888" value="0x1D900125" />
+        <register type="NOA" address="0x00009888" value="0x1F900123" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x53901000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x55900111" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="ce416533-e49e-4211-80af-ec513590a914"
+       chipset="BXT"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull stall pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x0C2E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A2F0000" />
+        <register type="NOA" address="0x00009888" value="0x10186800" />
+        <register type="NOA" address="0x00009888" value="0x11810019" />
+        <register type="NOA" address="0x00009888" value="0x15810013" />
+        <register type="NOA" address="0x00009888" value="0x13820020" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x17840000" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x21860000" />
+        <register type="NOA" address="0x00009888" value="0x178703E0" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x022E5400" />
+        <register type="NOA" address="0x00009888" value="0x002E0000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0080" />
+        <register type="NOA" address="0x00009888" value="0x082F0040" />
+        <register type="NOA" address="0x00009888" value="0x002F0000" />
+        <register type="NOA" address="0x00009888" value="0x06143000" />
+        <register type="NOA" address="0x00009888" value="0x06174000" />
+        <register type="NOA" address="0x00009888" value="0x06180012" />
+        <register type="NOA" address="0x00009888" value="0x00180000" />
+        <register type="NOA" address="0x00009888" value="0x0D804000" />
+        <register type="NOA" address="0x00009888" value="0x0F804000" />
+        <register type="NOA" address="0x00009888" value="0x05804000" />
+        <register type="NOA" address="0x00009888" value="0x09810200" />
+        <register type="NOA" address="0x00009888" value="0x0B810030" />
+        <register type="NOA" address="0x00009888" value="0x03810003" />
+        <register type="NOA" address="0x00009888" value="0x21819140" />
+        <register type="NOA" address="0x00009888" value="0x23819050" />
+        <register type="NOA" address="0x00009888" value="0x25810018" />
+        <register type="NOA" address="0x00009888" value="0x0B820980" />
+        <register type="NOA" address="0x00009888" value="0x03820D80" />
+        <register type="NOA" address="0x00009888" value="0x11820000" />
+        <register type="NOA" address="0x00009888" value="0x0182C000" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x09824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0D830004" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x0F831000" />
+        <register type="NOA" address="0x00009888" value="0x01848072" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x09844000" />
+        <register type="NOA" address="0x00009888" value="0x0F848000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x09860092" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x01869100" />
+        <register type="NOA" address="0x00009888" value="0x0F870065" />
+        <register type="NOA" address="0x00009888" value="0x01870000" />
+        <register type="NOA" address="0x00009888" value="0x19930800" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x1B952000" />
+        <register type="NOA" address="0x00009888" value="0x1D955055" />
+        <register type="NOA" address="0x00009888" value="0x1F951455" />
+        <register type="NOA" address="0x00009888" value="0x0992A000" />
+        <register type="NOA" address="0x00009888" value="0x0F928000" />
+        <register type="NOA" address="0x00009888" value="0x1192A800" />
+        <register type="NOA" address="0x00009888" value="0x1392028A" />
+        <register type="NOA" address="0x00009888" value="0x0B92A000" />
+        <register type="NOA" address="0x00009888" value="0x0D922000" />
+        <register type="NOA" address="0x00009888" value="0x13908000" />
+        <register type="NOA" address="0x00009888" value="0x21908000" />
+        <register type="NOA" address="0x00009888" value="0x23908000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27908000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C01" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900863" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900061" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C22" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="398e2452-18d7-42d0-b241-e4d0a9148ada"
+       chipset="BXT"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x19800343" />
+        <register type="NOA" address="0x00009888" value="0x39900340" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x41900003" />
+        <register type="NOA" address="0x00009888" value="0x03803180" />
+        <register type="NOA" address="0x00009888" value="0x058035E2" />
+        <register type="NOA" address="0x00009888" value="0x0780006A" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x2181A000" />
+        <register type="NOA" address="0x00009888" value="0x2381000A" />
+        <register type="NOA" address="0x00009888" value="0x1D950550" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D92A000" />
+        <register type="NOA" address="0x00009888" value="0x0F922000" />
+        <register type="NOA" address="0x00009888" value="0x13900170" />
+        <register type="NOA" address="0x00009888" value="0x21900171" />
+        <register type="NOA" address="0x00009888" value="0x23900172" />
+        <register type="NOA" address="0x00009888" value="0x25900173" />
+        <register type="NOA" address="0x00009888" value="0x27900174" />
+        <register type="NOA" address="0x00009888" value="0x29900175" />
+        <register type="NOA" address="0x00009888" value="0x2B900176" />
+        <register type="NOA" address="0x00009888" value="0x2D900177" />
+        <register type="NOA" address="0x00009888" value="0x2F90017F" />
+        <register type="NOA" address="0x00009888" value="0x31900125" />
+        <register type="NOA" address="0x00009888" value="0x15900123" />
+        <register type="NOA" address="0x00009888" value="0x17900121" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43901084" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47901080" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49901084" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B901084" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900004" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="d324a0d6-7269-4847-a5c2-6f71ddc7fed5"
+       chipset="BXT"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x19800343" />
+        <register type="NOA" address="0x00009888" value="0x39900340" />
+        <register type="NOA" address="0x00009888" value="0x3F900000" />
+        <register type="NOA" address="0x00009888" value="0x41900080" />
+        <register type="NOA" address="0x00009888" value="0x03803180" />
+        <register type="NOA" address="0x00009888" value="0x058035E2" />
+        <register type="NOA" address="0x00009888" value="0x0780006A" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x2181A000" />
+        <register type="NOA" address="0x00009888" value="0x2381000A" />
+        <register type="NOA" address="0x00009888" value="0x1D950550" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D92A000" />
+        <register type="NOA" address="0x00009888" value="0x0F922000" />
+        <register type="NOA" address="0x00009888" value="0x13900180" />
+        <register type="NOA" address="0x00009888" value="0x21900181" />
+        <register type="NOA" address="0x00009888" value="0x23900182" />
+        <register type="NOA" address="0x00009888" value="0x25900183" />
+        <register type="NOA" address="0x00009888" value="0x27900184" />
+        <register type="NOA" address="0x00009888" value="0x29900185" />
+        <register type="NOA" address="0x00009888" value="0x2B900186" />
+        <register type="NOA" address="0x00009888" value="0x2D900187" />
+        <register type="NOA" address="0x00009888" value="0x2F900170" />
+        <register type="NOA" address="0x00009888" value="0x31900125" />
+        <register type="NOA" address="0x00009888" value="0x15900123" />
+        <register type="NOA" address="0x00009888" value="0x17900121" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43901084" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47901080" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49901084" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B901084" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900004" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="caf3596a-7bb1-4dec-b3b3-2a080d283b49"
+       chipset="BXT"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C0160" />
+        <register type="NOA" address="0x00009888" value="0x161C0015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x002D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D5000" />
+        <register type="NOA" address="0x00009888" value="0x0A2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5400" />
+        <register type="NOA" address="0x00009888" value="0x0E2E5515" />
+        <register type="NOA" address="0x00009888" value="0x102E0155" />
+        <register type="NOA" address="0x00009888" value="0x044CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4CC000" />
+        <register type="NOA" address="0x00009888" value="0x0E4CC000" />
+        <register type="NOA" address="0x00009888" value="0x104C8000" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x004EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084EA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0C4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4F4B41" />
+        <register type="NOA" address="0x00009888" value="0x004F4200" />
+        <register type="NOA" address="0x00009888" value="0x024F404C" />
+        <register type="NOA" address="0x00009888" value="0x1C4F0000" />
+        <register type="NOA" address="0x00009888" value="0x1A4F0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0A1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0031" />
+        <register type="NOA" address="0x00009888" value="0x061C1900" />
+        <register type="NOA" address="0x00009888" value="0x081C1A33" />
+        <register type="NOA" address="0x00009888" value="0x0A1C1B35" />
+        <register type="NOA" address="0x00009888" value="0x0C1C3337" />
+        <register type="NOA" address="0x00009888" value="0x041C31C7" />
+        <register type="NOA" address="0x00009888" value="0x180F5000" />
+        <register type="NOA" address="0x00009888" value="0x1A0FA8AA" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0AAA" />
+        <register type="NOA" address="0x00009888" value="0x182C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C2C6AAA" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x1A2C2950" />
+        <register type="NOA" address="0x00009888" value="0x01938000" />
+        <register type="NOA" address="0x00009888" value="0x0F938000" />
+        <register type="NOA" address="0x00009888" value="0x1993AAAA" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29904000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900420" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900400" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="49b956e2-d5b9-47e0-9d8a-cee5e8cec527"
+       chipset="BXT"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages send to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C03B0" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F900C00" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x002D1000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E0400" />
+        <register type="NOA" address="0x00009888" value="0x0E2E1500" />
+        <register type="NOA" address="0x00009888" value="0x102E0140" />
+        <register type="NOA" address="0x00009888" value="0x044C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4CC000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x004E2000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x1A4F4001" />
+        <register type="NOA" address="0x00009888" value="0x1C4F5005" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x180F1000" />
+        <register type="NOA" address="0x00009888" value="0x1A0FA800" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C4000" />
+        <register type="NOA" address="0x00009888" value="0x1C2C4015" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x03931980" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x01938000" />
+        <register type="NOA" address="0x00009888" value="0x0F938000" />
+        <register type="NOA" address="0x00009888" value="0x1993A00A" />
+        <register type="NOA" address="0x00009888" value="0x07930000" />
+        <register type="NOA" address="0x00009888" value="0x09930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900177" />
+        <register type="NOA" address="0x00009888" value="0x1F900178" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x53901000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x55900111" />
+        <register type="NOA" address="0x00009888" value="0x47900001" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="ad9d9bc2-ccb7-4f5d-adbb-b4e67e615efd"
+       chipset="BXT"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x022D4000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0055" />
+        <register type="NOA" address="0x00009888" value="0x064C8000" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x024F6100" />
+        <register type="NOA" address="0x00009888" value="0x044F416B" />
+        <register type="NOA" address="0x00009888" value="0x064F004B" />
+        <register type="NOA" address="0x00009888" value="0x1A4F0000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F02A8" />
+        <register type="NOA" address="0x00009888" value="0x1A2C5500" />
+        <register type="NOA" address="0x00009888" value="0x0F808000" />
+        <register type="NOA" address="0x00009888" value="0x25810020" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x1F951000" />
+        <register type="NOA" address="0x00009888" value="0x13920200" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="bde7b434-349c-4aad-8596-eb23c0352168"
+       chipset="BXT"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x03 UGTE"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12643400" />
+        <register type="NOA" address="0x00009888" value="0x12653400" />
+        <register type="NOA" address="0x00009888" value="0x106C6800" />
+        <register type="NOA" address="0x00009888" value="0x126C001E" />
+        <register type="NOA" address="0x00009888" value="0x166C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x102E0154" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0055" />
+        <register type="NOA" address="0x00009888" value="0x104C8000" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x0C4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C4F5500" />
+        <register type="NOA" address="0x00009888" value="0x1A4F1554" />
+        <register type="NOA" address="0x00009888" value="0x0A640024" />
+        <register type="NOA" address="0x00009888" value="0x10640000" />
+        <register type="NOA" address="0x00009888" value="0x04640000" />
+        <register type="NOA" address="0x00009888" value="0x0C650024" />
+        <register type="NOA" address="0x00009888" value="0x10650000" />
+        <register type="NOA" address="0x00009888" value="0x06650000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0900" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0AA0" />
+        <register type="NOA" address="0x00009888" value="0x180F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F02AA" />
+        <register type="NOA" address="0x00009888" value="0x1C2C5400" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x1A2C5550" />
+        <register type="NOA" address="0x00009888" value="0x1993AA00" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900421" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900420" />
+        <register type="NOA" address="0x00009888" value="0x45900021" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x03 ULT"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x14640340" />
+        <register type="NOA" address="0x00009888" value="0x14650340" />
+        <register type="NOA" address="0x00009888" value="0x106C6800" />
+        <register type="NOA" address="0x00009888" value="0x126C001E" />
+        <register type="NOA" address="0x00009888" value="0x166C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x102E0154" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0055" />
+        <register type="NOA" address="0x00009888" value="0x104C8000" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x0C4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C4F5500" />
+        <register type="NOA" address="0x00009888" value="0x1A4F1554" />
+        <register type="NOA" address="0x00009888" value="0x04642400" />
+        <register type="NOA" address="0x00009888" value="0x22640000" />
+        <register type="NOA" address="0x00009888" value="0x1A640000" />
+        <register type="NOA" address="0x00009888" value="0x06650024" />
+        <register type="NOA" address="0x00009888" value="0x22650000" />
+        <register type="NOA" address="0x00009888" value="0x1C650000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0900" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0AA0" />
+        <register type="NOA" address="0x00009888" value="0x180F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F02AA" />
+        <register type="NOA" address="0x00009888" value="0x1C2C5400" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x1A2C5550" />
+        <register type="NOA" address="0x00009888" value="0x1993AA00" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900421" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900420" />
+        <register type="NOA" address="0x00009888" value="0x45900021" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="f3d845e6-bfc3-4ffe-b0e5-dddc80c21f07"
+       chipset="BXT"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x102D7800" />
+        <register type="NOA" address="0x00009888" value="0x122D79E0" />
+        <register type="NOA" address="0x00009888" value="0x0C2F0004" />
+        <register type="NOA" address="0x00009888" value="0x100E3800" />
+        <register type="NOA" address="0x00009888" value="0x180F0005" />
+        <register type="NOA" address="0x00009888" value="0x002D0940" />
+        <register type="NOA" address="0x00009888" value="0x022D802F" />
+        <register type="NOA" address="0x00009888" value="0x042D4013" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0050" />
+        <register type="NOA" address="0x00009888" value="0x022F0010" />
+        <register type="NOA" address="0x00009888" value="0x002F0000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x040E0480" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x060F0027" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F0040" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x439014A0" />
+        <register type="NOA" address="0x00009888" value="0x459000A4" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="a53d620b-c14e-49df-bd27-e076b3fb98f3"
+       chipset="BXT"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121300A0" />
+        <register type="NOA" address="0x00009888" value="0x141600AB" />
+        <register type="NOA" address="0x00009888" value="0x123300A0" />
+        <register type="NOA" address="0x00009888" value="0x143600AB" />
+        <register type="NOA" address="0x00009888" value="0x125300A0" />
+        <register type="NOA" address="0x00009888" value="0x145600AB" />
+        <register type="NOA" address="0x00009888" value="0x0C2D4000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x102E01A0" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0065" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x084C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x044E2000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x180F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F023F" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0003" />
+        <register type="NOA" address="0x00009888" value="0x1A2CC030" />
+        <register type="NOA" address="0x00009888" value="0x04132180" />
+        <register type="NOA" address="0x00009888" value="0x02130000" />
+        <register type="NOA" address="0x00009888" value="0x0C148000" />
+        <register type="NOA" address="0x00009888" value="0x0E142000" />
+        <register type="NOA" address="0x00009888" value="0x04148000" />
+        <register type="NOA" address="0x00009888" value="0x1E150140" />
+        <register type="NOA" address="0x00009888" value="0x1C150040" />
+        <register type="NOA" address="0x00009888" value="0x0C163000" />
+        <register type="NOA" address="0x00009888" value="0x0E160068" />
+        <register type="NOA" address="0x00009888" value="0x10160000" />
+        <register type="NOA" address="0x00009888" value="0x18160000" />
+        <register type="NOA" address="0x00009888" value="0x0A164000" />
+        <register type="NOA" address="0x00009888" value="0x04330043" />
+        <register type="NOA" address="0x00009888" value="0x02330000" />
+        <register type="NOA" address="0x00009888" value="0x0234A000" />
+        <register type="NOA" address="0x00009888" value="0x04342000" />
+        <register type="NOA" address="0x00009888" value="0x1C350015" />
+        <register type="NOA" address="0x00009888" value="0x02363460" />
+        <register type="NOA" address="0x00009888" value="0x10360000" />
+        <register type="NOA" address="0x00009888" value="0x04360000" />
+        <register type="NOA" address="0x00009888" value="0x06360000" />
+        <register type="NOA" address="0x00009888" value="0x08364000" />
+        <register type="NOA" address="0x00009888" value="0x06530043" />
+        <register type="NOA" address="0x00009888" value="0x02530000" />
+        <register type="NOA" address="0x00009888" value="0x0E548000" />
+        <register type="NOA" address="0x00009888" value="0x00548000" />
+        <register type="NOA" address="0x00009888" value="0x06542000" />
+        <register type="NOA" address="0x00009888" value="0x1E550400" />
+        <register type="NOA" address="0x00009888" value="0x1A552000" />
+        <register type="NOA" address="0x00009888" value="0x1C550100" />
+        <register type="NOA" address="0x00009888" value="0x0E563000" />
+        <register type="NOA" address="0x00009888" value="0x00563400" />
+        <register type="NOA" address="0x00009888" value="0x10560000" />
+        <register type="NOA" address="0x00009888" value="0x18560000" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x0C564000" />
+        <register type="NOA" address="0x00009888" value="0x1993A800" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B9014A0" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900820" />
+        <register type="NOA" address="0x00009888" value="0x45901022" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="8a44b172-6e1d-445f-8937-c06cc487ba39"
+       chipset="BXT"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A0000" />
+        <register type="NOA" address="0x00009888" value="0x143A0000" />
+        <register type="NOA" address="0x00009888" value="0x145A0000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D4000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x102E0150" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E006A" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024E2000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0BC0" />
+        <register type="NOA" address="0x00009888" value="0x180F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F0302" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0003" />
+        <register type="NOA" address="0x00009888" value="0x1A2C00F0" />
+        <register type="NOA" address="0x00009888" value="0x021A3080" />
+        <register type="NOA" address="0x00009888" value="0x041A31E5" />
+        <register type="NOA" address="0x00009888" value="0x02148000" />
+        <register type="NOA" address="0x00009888" value="0x0414A000" />
+        <register type="NOA" address="0x00009888" value="0x1C150054" />
+        <register type="NOA" address="0x00009888" value="0x06168000" />
+        <register type="NOA" address="0x00009888" value="0x08168000" />
+        <register type="NOA" address="0x00009888" value="0x0A168000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A3280" />
+        <register type="NOA" address="0x00009888" value="0x0E3A0063" />
+        <register type="NOA" address="0x00009888" value="0x063A0061" />
+        <register type="NOA" address="0x00009888" value="0x023A0000" />
+        <register type="NOA" address="0x00009888" value="0x0C348000" />
+        <register type="NOA" address="0x00009888" value="0x0E342000" />
+        <register type="NOA" address="0x00009888" value="0x06342000" />
+        <register type="NOA" address="0x00009888" value="0x1E350140" />
+        <register type="NOA" address="0x00009888" value="0x1C350100" />
+        <register type="NOA" address="0x00009888" value="0x18360028" />
+        <register type="NOA" address="0x00009888" value="0x0C368000" />
+        <register type="NOA" address="0x00009888" value="0x0E5A3080" />
+        <register type="NOA" address="0x00009888" value="0x005A3280" />
+        <register type="NOA" address="0x00009888" value="0x025A0063" />
+        <register type="NOA" address="0x00009888" value="0x0E548000" />
+        <register type="NOA" address="0x00009888" value="0x00548000" />
+        <register type="NOA" address="0x00009888" value="0x02542000" />
+        <register type="NOA" address="0x00009888" value="0x1E550400" />
+        <register type="NOA" address="0x00009888" value="0x1A552000" />
+        <register type="NOA" address="0x00009888" value="0x1C550001" />
+        <register type="NOA" address="0x00009888" value="0x18560080" />
+        <register type="NOA" address="0x00009888" value="0x02568000" />
+        <register type="NOA" address="0x00009888" value="0x04568000" />
+        <register type="NOA" address="0x00009888" value="0x1993A800" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x45901084" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="9d4643f8-aa05-482e-8193-070a8ab0d117"
+       chipset="BXT"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A026B" />
+        <register type="NOA" address="0x00009888" value="0x143A0173" />
+        <register type="NOA" address="0x00009888" value="0x145A026B" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0069" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x180F6000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F030A" />
+        <register type="NOA" address="0x00009888" value="0x1A2C03C0" />
+        <register type="NOA" address="0x00009888" value="0x041A37E7" />
+        <register type="NOA" address="0x00009888" value="0x021A0000" />
+        <register type="NOA" address="0x00009888" value="0x0414A000" />
+        <register type="NOA" address="0x00009888" value="0x1C150050" />
+        <register type="NOA" address="0x00009888" value="0x08168000" />
+        <register type="NOA" address="0x00009888" value="0x0A168000" />
+        <register type="NOA" address="0x00009888" value="0x003A3380" />
+        <register type="NOA" address="0x00009888" value="0x063A006F" />
+        <register type="NOA" address="0x00009888" value="0x023A0000" />
+        <register type="NOA" address="0x00009888" value="0x00348000" />
+        <register type="NOA" address="0x00009888" value="0x06342000" />
+        <register type="NOA" address="0x00009888" value="0x1A352000" />
+        <register type="NOA" address="0x00009888" value="0x1C350100" />
+        <register type="NOA" address="0x00009888" value="0x02368000" />
+        <register type="NOA" address="0x00009888" value="0x0C368000" />
+        <register type="NOA" address="0x00009888" value="0x025A37E7" />
+        <register type="NOA" address="0x00009888" value="0x0254A000" />
+        <register type="NOA" address="0x00009888" value="0x1C550005" />
+        <register type="NOA" address="0x00009888" value="0x04568000" />
+        <register type="NOA" address="0x00009888" value="0x06568000" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900020" />
+        <register type="NOA" address="0x00009888" value="0x45901080" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="fa6ecf21-2cb8-4d0b-9308-6e4a7b4ca87a"
+       chipset="BXT"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 7 READ C 6 READ FADD C 5 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A001F" />
+        <register type="NOA" address="0x00009888" value="0x143A001F" />
+        <register type="NOA" address="0x00009888" value="0x145A001F" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0094" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F00E0" />
+        <register type="NOA" address="0x00009888" value="0x1A2C0C00" />
+        <register type="NOA" address="0x00009888" value="0x061A0063" />
+        <register type="NOA" address="0x00009888" value="0x021A0000" />
+        <register type="NOA" address="0x00009888" value="0x06142000" />
+        <register type="NOA" address="0x00009888" value="0x1C150100" />
+        <register type="NOA" address="0x00009888" value="0x0C168000" />
+        <register type="NOA" address="0x00009888" value="0x043A3180" />
+        <register type="NOA" address="0x00009888" value="0x023A0000" />
+        <register type="NOA" address="0x00009888" value="0x04348000" />
+        <register type="NOA" address="0x00009888" value="0x1C350040" />
+        <register type="NOA" address="0x00009888" value="0x0A368000" />
+        <register type="NOA" address="0x00009888" value="0x045A0063" />
+        <register type="NOA" address="0x00009888" value="0x025A0000" />
+        <register type="NOA" address="0x00009888" value="0x04542000" />
+        <register type="NOA" address="0x00009888" value="0x1C550010" />
+        <register type="NOA" address="0x00009888" value="0x08568000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900004" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00001000" />
+        <register type="FLEX" address="0x0000E558" value="0x00003002" />
+        <register type="FLEX" address="0x0000E658" value="0x00005004" />
+        <register type="FLEX" address="0x0000E758" value="0x00011010" />
+        <register type="FLEX" address="0x0000E45C" value="0x00050012" />
+        <register type="FLEX" address="0x0000E55C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E65C" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="c9f5fa3a-d14f-400c-a89a-211206b00ee7"
+       chipset="BXT"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x13805800" />
+        <register type="NOA" address="0x00009888" value="0x05962C00" />
+        <register type="NOA" address="0x00009888" value="0x19950016" />
+        <register type="NOA" address="0x00009888" value="0x21C05800" />
+        <register type="NOA" address="0x00009888" value="0x07800035" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x23810008" />
+        <register type="NOA" address="0x00009888" value="0x07960025" />
+        <register type="NOA" address="0x00009888" value="0x1D960000" />
+        <register type="NOA" address="0x00009888" value="0x0F960000" />
+        <register type="NOA" address="0x00009888" value="0x0B934000" />
+        <register type="NOA" address="0x00009888" value="0x09948000" />
+        <register type="NOA" address="0x00009888" value="0x05950085" />
+        <register type="NOA" address="0x00009888" value="0x11950000" />
+        <register type="NOA" address="0x00009888" value="0x1D950400" />
+        <register type="NOA" address="0x00009888" value="0x0B924000" />
+        <register type="NOA" address="0x00009888" value="0x0D922000" />
+        <register type="NOA" address="0x00009888" value="0x0F922000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x0BC000A5" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900442" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00078000" />
+        <register type="OA" address="0x00002774" value="0x00000FFF" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="5ee72f5c-092f-421e-8b70-225f7c3e9612"
+       chipset="BXT"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x19800000" />
+        <register type="NOA" address="0x00009888" value="0x07800063" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x23810008" />
+        <register type="NOA" address="0x00009888" value="0x1D950400" />
+        <register type="NOA" address="0x00009888" value="0x0F922000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="d49cd0d8-8c7f-4465-94fc-51e08c9050bc"
+       chipset="BXT"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x124C3080" />
+        <register type="NOA" address="0x00009888" value="0x002D1000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D5000" />
+        <register type="NOA" address="0x00009888" value="0x0A2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E0400" />
+        <register type="NOA" address="0x00009888" value="0x0E2E5500" />
+        <register type="NOA" address="0x00009888" value="0x102E0001" />
+        <register type="NOA" address="0x00009888" value="0x004C0045" />
+        <register type="NOA" address="0x00009888" value="0x064C2300" />
+        <register type="NOA" address="0x00009888" value="0x084C26C4" />
+        <register type="NOA" address="0x00009888" value="0x0A4C264E" />
+        <register type="NOA" address="0x00009888" value="0x164C0000" />
+        <register type="NOA" address="0x00009888" value="0x044C0000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E4C0000" />
+        <register type="NOA" address="0x00009888" value="0x01938000" />
+        <register type="NOA" address="0x00009888" value="0x0F938000" />
+        <register type="NOA" address="0x00009888" value="0x199300AA" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29904000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-cflgt2.xml b/lib/i915/perf-configs/oa-cflgt2.xml
new file mode 100644
index 00000000..4b465d68
--- /dev/null
+++ b/lib/i915/perf-configs/oa-cflgt2.xml
@@ -0,0 +1,10866 @@
+<?xml version="1.0"?>
+<metrics version="1562317148" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="7fa796a4-0c7a-4201-afc6-cff0b2f528a2"
+       chipset="CFLGT2"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C01E0" />
+        <register type="NOA" address="0x00009888" value="0x12170280" />
+        <register type="NOA" address="0x00009888" value="0x12370280" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0080" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A1B4000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0001" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x042F1000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8400" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F6600" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C2200" />
+        <register type="NOA" address="0x00009888" value="0x062D8000" />
+        <register type="NOA" address="0x00009888" value="0x082D8000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x08133000" />
+        <register type="NOA" address="0x00009888" value="0x00170020" />
+        <register type="NOA" address="0x00009888" value="0x08170021" />
+        <register type="NOA" address="0x00009888" value="0x10170000" />
+        <register type="NOA" address="0x00009888" value="0x0633C000" />
+        <register type="NOA" address="0x00009888" value="0x0833C000" />
+        <register type="NOA" address="0x00009888" value="0x06370800" />
+        <register type="NOA" address="0x00009888" value="0x08370840" />
+        <register type="NOA" address="0x00009888" value="0x10370000" />
+        <register type="NOA" address="0x00009888" value="0x0D933031" />
+        <register type="NOA" address="0x00009888" value="0x0F933E3F" />
+        <register type="NOA" address="0x00009888" value="0x01933D00" />
+        <register type="NOA" address="0x00009888" value="0x0393073C" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1D930000" />
+        <register type="NOA" address="0x00009888" value="0x19930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190001F" />
+        <register type="NOA" address="0x00009888" value="0x51904400" />
+        <register type="NOA" address="0x00009888" value="0x41900020" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C21" />
+        <register type="NOA" address="0x00009888" value="0x47900061" />
+        <register type="NOA" address="0x00009888" value="0x57904440" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900004" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="dc8cf7ea-26b4-4478-ac93-dab174f92ac0"
+       chipset="CFLGT2"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0820" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x064F0900" />
+        <register type="NOA" address="0x00009888" value="0x084F0032" />
+        <register type="NOA" address="0x00009888" value="0x0A4F1891" />
+        <register type="NOA" address="0x00009888" value="0x0C4F0E00" />
+        <register type="NOA" address="0x00009888" value="0x0E4F003C" />
+        <register type="NOA" address="0x00009888" value="0x004F0D80" />
+        <register type="NOA" address="0x00009888" value="0x024F003B" />
+        <register type="NOA" address="0x00009888" value="0x006C0002" />
+        <register type="NOA" address="0x00009888" value="0x086C0100" />
+        <register type="NOA" address="0x00009888" value="0x0C6C000C" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B00" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x081B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E1B8000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0024" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C6000" />
+        <register type="NOA" address="0x00009888" value="0x1C5C001B" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0208" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+        <register type="NOA" address="0x00009888" value="0x162CFB00" />
+        <register type="NOA" address="0x00009888" value="0x182C00BE" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x19900157" />
+        <register type="NOA" address="0x00009888" value="0x1B900158" />
+        <register type="NOA" address="0x00009888" value="0x1D900105" />
+        <register type="NOA" address="0x00009888" value="0x1F900103" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x11900FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900821" />
+        <register type="NOA" address="0x00009888" value="0x47900802" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900802" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900002" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900422" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="2221e4d5-ed7b-445e-b2cc-3de1b97f4d42"
+       chipset="CFLGT2"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull stall pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x10116800" />
+        <register type="NOA" address="0x00009888" value="0x178A03E0" />
+        <register type="NOA" address="0x00009888" value="0x11824C00" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x13840020" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x01870C40" />
+        <register type="NOA" address="0x00009888" value="0x17880000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x040D4000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020E5400" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x080F0040" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06110012" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890100" />
+        <register type="NOA" address="0x00009888" value="0x03898000" />
+        <register type="NOA" address="0x00009888" value="0x09808000" />
+        <register type="NOA" address="0x00009888" value="0x0B808000" />
+        <register type="NOA" address="0x00009888" value="0x0380C000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+        <register type="NOA" address="0x00009888" value="0x138A8000" />
+        <register type="NOA" address="0x00009888" value="0x1D81A000" />
+        <register type="NOA" address="0x00009888" value="0x15818000" />
+        <register type="NOA" address="0x00009888" value="0x17818000" />
+        <register type="NOA" address="0x00009888" value="0x0B820030" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x05824000" />
+        <register type="NOA" address="0x00009888" value="0x0D830003" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x03838000" />
+        <register type="NOA" address="0x00009888" value="0x07838000" />
+        <register type="NOA" address="0x00009888" value="0x0B840980" />
+        <register type="NOA" address="0x00009888" value="0x03844D80" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x09850080" />
+        <register type="NOA" address="0x00009888" value="0x03850003" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x09870032" />
+        <register type="NOA" address="0x00009888" value="0x01888052" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x09884000" />
+        <register type="NOA" address="0x00009888" value="0x1B931001" />
+        <register type="NOA" address="0x00009888" value="0x1D930001" />
+        <register type="NOA" address="0x00009888" value="0x19934000" />
+        <register type="NOA" address="0x00009888" value="0x1B958000" />
+        <register type="NOA" address="0x00009888" value="0x1D950094" />
+        <register type="NOA" address="0x00009888" value="0x19958000" />
+        <register type="NOA" address="0x00009888" value="0x09E58000" />
+        <register type="NOA" address="0x00009888" value="0x0BE58000" />
+        <register type="NOA" address="0x00009888" value="0x03E5C000" />
+        <register type="NOA" address="0x00009888" value="0x0592C000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D924000" />
+        <register type="NOA" address="0x00009888" value="0x0F924000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x1392C000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x01985000" />
+        <register type="NOA" address="0x00009888" value="0x07988000" />
+        <register type="NOA" address="0x00009888" value="0x09981000" />
+        <register type="NOA" address="0x00009888" value="0x0B982000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x0F989000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1190C080" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900440" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900C21" />
+        <register type="NOA" address="0x00009888" value="0x57900400" />
+        <register type="NOA" address="0x00009888" value="0x49900042" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900024" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900841" />
+        <register type="NOA" address="0x00009888" value="0x53900400" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="82096a90-e2fa-4f38-ac14-562b2496933a"
+       chipset="CFLGT2"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900064" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900150" />
+        <register type="NOA" address="0x00009888" value="0x21900151" />
+        <register type="NOA" address="0x00009888" value="0x23900152" />
+        <register type="NOA" address="0x00009888" value="0x25900153" />
+        <register type="NOA" address="0x00009888" value="0x27900154" />
+        <register type="NOA" address="0x00009888" value="0x29900155" />
+        <register type="NOA" address="0x00009888" value="0x2B900156" />
+        <register type="NOA" address="0x00009888" value="0x2D900157" />
+        <register type="NOA" address="0x00009888" value="0x2F90015F" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="9f638880-02e9-4a8d-896a-7670a3bf0d35"
+       chipset="CFLGT2"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900160" />
+        <register type="NOA" address="0x00009888" value="0x21900161" />
+        <register type="NOA" address="0x00009888" value="0x23900162" />
+        <register type="NOA" address="0x00009888" value="0x25900163" />
+        <register type="NOA" address="0x00009888" value="0x27900164" />
+        <register type="NOA" address="0x00009888" value="0x29900165" />
+        <register type="NOA" address="0x00009888" value="0x2B900166" />
+        <register type="NOA" address="0x00009888" value="0x2D900167" />
+        <register type="NOA" address="0x00009888" value="0x2F900150" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="8d4ad934-7c16-43d5-845a-51067a4c8e2f"
+       chipset="CFLGT2"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C8160" />
+        <register type="NOA" address="0x00009888" value="0x161C8015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4EAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B01" />
+        <register type="NOA" address="0x00009888" value="0x006C0200" />
+        <register type="NOA" address="0x00009888" value="0x026C000C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0041" />
+        <register type="NOA" address="0x00009888" value="0x061C4200" />
+        <register type="NOA" address="0x00009888" value="0x081C4443" />
+        <register type="NOA" address="0x00009888" value="0x0A1C4645" />
+        <register type="NOA" address="0x00009888" value="0x0C1C7647" />
+        <register type="NOA" address="0x00009888" value="0x041C7357" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0000" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4CAA2A" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02AA" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5515" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x11907FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900802" />
+        <register type="NOA" address="0x00009888" value="0x47900842" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900842" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900800" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="4389cf07-1424-4963-b2d2-64fcec75406d"
+       chipset="CFLGT2"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages send to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C0760" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E8020" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1CE000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2A00" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0280" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F1500" />
+        <register type="NOA" address="0x00009888" value="0x100F0140" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C00A0" />
+        <register type="NOA" address="0x00009888" value="0x03933300" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190030F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900021" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="ac544b3a-ff78-46ea-9808-ee6fef0978b4"
+       chipset="CFLGT2"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x106C0232" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F1880" />
+        <register type="NOA" address="0x00009888" value="0x024F08BB" />
+        <register type="NOA" address="0x00009888" value="0x044F001B" />
+        <register type="NOA" address="0x00009888" value="0x046C0100" />
+        <register type="NOA" address="0x00009888" value="0x066C000B" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x041B8000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025BC000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x165C8000" />
+        <register type="NOA" address="0x00009888" value="0x185C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00A0" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x062CC000" />
+        <register type="NOA" address="0x00009888" value="0x082CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x07830000" />
+        <register type="NOA" address="0x00009888" value="0x1D950080" />
+        <register type="NOA" address="0x00009888" value="0x13928000" />
+        <register type="NOA" address="0x00009888" value="0x0F988000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900040" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="a35c5867-0ab8-4d45-8fc1-eb0906f0eff5"
+       chipset="CFLGT2"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C7B40" />
+        <register type="NOA" address="0x00009888" value="0x166C0020" />
+        <register type="NOA" address="0x00009888" value="0x0A603444" />
+        <register type="NOA" address="0x00009888" value="0x0A613400" />
+        <register type="NOA" address="0x00009888" value="0x1A4EA800" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0800" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C003C" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x10600000" />
+        <register type="NOA" address="0x00009888" value="0x04600000" />
+        <register type="NOA" address="0x00009888" value="0x0C610044" />
+        <register type="NOA" address="0x00009888" value="0x10610000" />
+        <register type="NOA" address="0x00009888" value="0x06610000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02A8" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0154" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190FFC0" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900021" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900400" />
+        <register type="NOA" address="0x00009888" value="0x43900421" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="bb4bcce9-2cbb-4818-9e49-67ce2c99cd25"
+       chipset="CFLGT2"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C02E0" />
+        <register type="NOA" address="0x00009888" value="0x146C0001" />
+        <register type="NOA" address="0x00009888" value="0x0A623400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x026C3324" />
+        <register type="NOA" address="0x00009888" value="0x046C3422" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x06614000" />
+        <register type="NOA" address="0x00009888" value="0x0C620044" />
+        <register type="NOA" address="0x00009888" value="0x10620000" />
+        <register type="NOA" address="0x00009888" value="0x06620000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="9e1229f8-d87f-4f44-b067-3544e17195aa"
+       chipset="CFLGT2"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C4E80" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A633400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x026C3321" />
+        <register type="NOA" address="0x00009888" value="0x046C342F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C2000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x06604000" />
+        <register type="NOA" address="0x00009888" value="0x0C630044" />
+        <register type="NOA" address="0x00009888" value="0x10630000" />
+        <register type="NOA" address="0x00009888" value="0x06630000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00AA" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="3e91908a-1c70-4004-b2ab-a10ef14f24f9"
+       chipset="CFLGT2"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x102F3800" />
+        <register type="NOA" address="0x00009888" value="0x144D0500" />
+        <register type="NOA" address="0x00009888" value="0x120D03C0" />
+        <register type="NOA" address="0x00009888" value="0x140D03CF" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0004" />
+        <register type="NOA" address="0x00009888" value="0x0C4E4000" />
+        <register type="NOA" address="0x00009888" value="0x042F0480" />
+        <register type="NOA" address="0x00009888" value="0x082F0000" />
+        <register type="NOA" address="0x00009888" value="0x022F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0090" />
+        <register type="NOA" address="0x00009888" value="0x064D0027" />
+        <register type="NOA" address="0x00009888" value="0x004D0000" />
+        <register type="NOA" address="0x00009888" value="0x000D0D40" />
+        <register type="NOA" address="0x00009888" value="0x020D803F" />
+        <register type="NOA" address="0x00009888" value="0x040D8023" />
+        <register type="NOA" address="0x00009888" value="0x100D0000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020F0010" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0050" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41901400" />
+        <register type="NOA" address="0x00009888" value="0x43901485" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="9a6ba957-7955-4a09-a8ce-083030ba3c1f"
+       chipset="CFLGT2"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x14152C00" />
+        <register type="NOA" address="0x00009888" value="0x16150005" />
+        <register type="NOA" address="0x00009888" value="0x121600A0" />
+        <register type="NOA" address="0x00009888" value="0x14352C00" />
+        <register type="NOA" address="0x00009888" value="0x16350005" />
+        <register type="NOA" address="0x00009888" value="0x123600A0" />
+        <register type="NOA" address="0x00009888" value="0x14552C00" />
+        <register type="NOA" address="0x00009888" value="0x16550005" />
+        <register type="NOA" address="0x00009888" value="0x125600A0" />
+        <register type="NOA" address="0x00009888" value="0x062F6000" />
+        <register type="NOA" address="0x00009888" value="0x022F2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0050" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0350" />
+        <register type="NOA" address="0x00009888" value="0x0C0FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F00DA" />
+        <register type="NOA" address="0x00009888" value="0x182C0028" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x022DC000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C138000" />
+        <register type="NOA" address="0x00009888" value="0x0E132000" />
+        <register type="NOA" address="0x00009888" value="0x0413C000" />
+        <register type="NOA" address="0x00009888" value="0x1C140018" />
+        <register type="NOA" address="0x00009888" value="0x0C157000" />
+        <register type="NOA" address="0x00009888" value="0x0E150078" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04162180" />
+        <register type="NOA" address="0x00009888" value="0x02160000" />
+        <register type="NOA" address="0x00009888" value="0x04174000" />
+        <register type="NOA" address="0x00009888" value="0x0233A000" />
+        <register type="NOA" address="0x00009888" value="0x04333000" />
+        <register type="NOA" address="0x00009888" value="0x14348000" />
+        <register type="NOA" address="0x00009888" value="0x16348000" />
+        <register type="NOA" address="0x00009888" value="0x02357870" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04360043" />
+        <register type="NOA" address="0x00009888" value="0x02360000" />
+        <register type="NOA" address="0x00009888" value="0x04371000" />
+        <register type="NOA" address="0x00009888" value="0x0E538000" />
+        <register type="NOA" address="0x00009888" value="0x00538000" />
+        <register type="NOA" address="0x00009888" value="0x06533000" />
+        <register type="NOA" address="0x00009888" value="0x1C540020" />
+        <register type="NOA" address="0x00009888" value="0x12548000" />
+        <register type="NOA" address="0x00009888" value="0x0E557000" />
+        <register type="NOA" address="0x00009888" value="0x00557800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06560043" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x06571000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900060" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900060" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="c54e7ca3-c60c-4396-ac3d-f9899c9a6ee4"
+       chipset="CFLGT2"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12120000" />
+        <register type="NOA" address="0x00009888" value="0x12320000" />
+        <register type="NOA" address="0x00009888" value="0x12520000" />
+        <register type="NOA" address="0x00009888" value="0x002F8000" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0015" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F03A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0FF000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0095" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x02108000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x02118000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x02121880" />
+        <register type="NOA" address="0x00009888" value="0x041219B5" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x02134000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x0C308000" />
+        <register type="NOA" address="0x00009888" value="0x0E304000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x0C318000" />
+        <register type="NOA" address="0x00009888" value="0x0E314000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x0C321A80" />
+        <register type="NOA" address="0x00009888" value="0x0E320033" />
+        <register type="NOA" address="0x00009888" value="0x06320031" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x0C334000" />
+        <register type="NOA" address="0x00009888" value="0x0E331000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0E508000" />
+        <register type="NOA" address="0x00009888" value="0x00508000" />
+        <register type="NOA" address="0x00009888" value="0x02504000" />
+        <register type="NOA" address="0x00009888" value="0x0E518000" />
+        <register type="NOA" address="0x00009888" value="0x00518000" />
+        <register type="NOA" address="0x00009888" value="0x02514000" />
+        <register type="NOA" address="0x00009888" value="0x0E521880" />
+        <register type="NOA" address="0x00009888" value="0x00521A80" />
+        <register type="NOA" address="0x00009888" value="0x02520033" />
+        <register type="NOA" address="0x00009888" value="0x0E534000" />
+        <register type="NOA" address="0x00009888" value="0x00534000" />
+        <register type="NOA" address="0x00009888" value="0x02531000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900062" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="e438cd5d-1da7-46c6-9823-4780f370d11d"
+       chipset="CFLGT2"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12124D60" />
+        <register type="NOA" address="0x00009888" value="0x12322E60" />
+        <register type="NOA" address="0x00009888" value="0x12524D60" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0014" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0FE000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0097" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x002D8000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x04121FB7" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x00308000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x00318000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x00321B80" />
+        <register type="NOA" address="0x00009888" value="0x0632003F" />
+        <register type="NOA" address="0x00009888" value="0x00334000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0250C000" />
+        <register type="NOA" address="0x00009888" value="0x0251C000" />
+        <register type="NOA" address="0x00009888" value="0x02521FB7" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x02535000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900063" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="5f679fb0-909e-4c0e-b4b2-8e801f83e71b"
+       chipset="CFLGT2"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 7 READ C 6 READ FADD C 5 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121203E0" />
+        <register type="NOA" address="0x00009888" value="0x123203E0" />
+        <register type="NOA" address="0x00009888" value="0x125203E0" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F006C" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x042D8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06114000" />
+        <register type="NOA" address="0x00009888" value="0x06120033" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x04308000" />
+        <register type="NOA" address="0x00009888" value="0x04318000" />
+        <register type="NOA" address="0x00009888" value="0x04321980" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x04334000" />
+        <register type="NOA" address="0x00009888" value="0x04504000" />
+        <register type="NOA" address="0x00009888" value="0x04514000" />
+        <register type="NOA" address="0x00009888" value="0x04520033" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x04531000" />
+        <register type="NOA" address="0x00009888" value="0x1190E000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C00" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00001000" />
+        <register type="FLEX" address="0x0000E558" value="0x00003002" />
+        <register type="FLEX" address="0x0000E658" value="0x00005004" />
+        <register type="FLEX" address="0x0000E758" value="0x00011010" />
+        <register type="FLEX" address="0x0000E45C" value="0x00050012" />
+        <register type="FLEX" address="0x0000E55C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E65C" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="Media Vme Pipe Gen9"
+       mdapi_supported_apis="MEDIA IO BB"
+       underscore_name="vme_pipe"
+       hw_config_guid="0d09ba9a-1d1c-457d-83e2-74ac448014d6"
+       chipset="CFLGT2"
+       symbol_name="VMEPipe"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VME Busy"
+             description="The percentage of time in which VME (IME or CRE) was actively processing data."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vme_busy"
+             units="percent"
+             symbol_name="VMEBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview System Batch Tier2"
+             mdapi_group="VME Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A5800" />
+        <register type="NOA" address="0x00009888" value="0x161A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12180240" />
+        <register type="NOA" address="0x00009888" value="0x14180002" />
+        <register type="NOA" address="0x00009888" value="0x143A5800" />
+        <register type="NOA" address="0x00009888" value="0x163A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12380240" />
+        <register type="NOA" address="0x00009888" value="0x14380002" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x022F8000" />
+        <register type="NOA" address="0x00009888" value="0x042F3000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C1500" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F9500" />
+        <register type="NOA" address="0x00009888" value="0x100F002A" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x0A2DC000" />
+        <register type="NOA" address="0x00009888" value="0x0C2DC000" />
+        <register type="NOA" address="0x00009888" value="0x04193000" />
+        <register type="NOA" address="0x00009888" value="0x081A28C1" />
+        <register type="NOA" address="0x00009888" value="0x001A0000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x0613C000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x00172000" />
+        <register type="NOA" address="0x00009888" value="0x06178000" />
+        <register type="NOA" address="0x00009888" value="0x0817A000" />
+        <register type="NOA" address="0x00009888" value="0x00180037" />
+        <register type="NOA" address="0x00009888" value="0x06180940" />
+        <register type="NOA" address="0x00009888" value="0x08180000" />
+        <register type="NOA" address="0x00009888" value="0x02180000" />
+        <register type="NOA" address="0x00009888" value="0x04183000" />
+        <register type="NOA" address="0x00009888" value="0x06393000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A28C1" />
+        <register type="NOA" address="0x00009888" value="0x003A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A33F000" />
+        <register type="NOA" address="0x00009888" value="0x0C33F000" />
+        <register type="NOA" address="0x00009888" value="0x0A37A000" />
+        <register type="NOA" address="0x00009888" value="0x0C37A000" />
+        <register type="NOA" address="0x00009888" value="0x0A380977" />
+        <register type="NOA" address="0x00009888" value="0x08380000" />
+        <register type="NOA" address="0x00009888" value="0x04380000" />
+        <register type="NOA" address="0x00009888" value="0x06383000" />
+        <register type="NOA" address="0x00009888" value="0x119000FF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900800" />
+        <register type="NOA" address="0x00009888" value="0x47901000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900844" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00100030" />
+        <register type="OA" address="0x00002774" value="0x0000FFF9" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFF3" />
+        <register type="OA" address="0x00002788" value="0x00100180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="e2f162ae-5732-4af0-8b11-69510f57094a"
+       chipset="CFLGT2"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x13805800" />
+        <register type="NOA" address="0x00009888" value="0x05962C00" />
+        <register type="NOA" address="0x00009888" value="0x19950016" />
+        <register type="NOA" address="0x00009888" value="0x19C05800" />
+        <register type="NOA" address="0x00009888" value="0x07800035" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x1D810400" />
+        <register type="NOA" address="0x00009888" value="0x07960025" />
+        <register type="NOA" address="0x00009888" value="0x21960000" />
+        <register type="NOA" address="0x00009888" value="0x0B964000" />
+        <register type="NOA" address="0x00009888" value="0x1B930062" />
+        <register type="NOA" address="0x00009888" value="0x17948000" />
+        <register type="NOA" address="0x00009888" value="0x1B940008" />
+        <register type="NOA" address="0x00009888" value="0x05950075" />
+        <register type="NOA" address="0x00009888" value="0x1D950000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x09978000" />
+        <register type="NOA" address="0x00009888" value="0x05C08500" />
+        <register type="NOA" address="0x00009888" value="0x25C00000" />
+        <register type="NOA" address="0x00009888" value="0x1BC00000" />
+        <register type="NOA" address="0x00009888" value="0x0BC54000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C60" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00078000" />
+        <register type="OA" address="0x00002774" value="0x00000FFF" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9.5"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="74fb4902-d3d3-4237-9e90-cbdc68d0a446"
+       chipset="CFLGT2"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810000" />
+        <register type="NOA" address="0x00009888" value="0x07810013" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930040" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="5ccbf9fb-6bf2-456b-a749-bdff7b1aff13"
+       chipset="CFLGT2"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x122D3080" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E0FAA00" />
+        <register type="NOA" address="0x00009888" value="0x100F0002" />
+        <register type="NOA" address="0x00009888" value="0x002D0025" />
+        <register type="NOA" address="0x00009888" value="0x062D1300" />
+        <register type="NOA" address="0x00009888" value="0x082D16A4" />
+        <register type="NOA" address="0x00009888" value="0x0A2D162E" />
+        <register type="NOA" address="0x00009888" value="0x102D0000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-cflgt3.xml b/lib/i915/perf-configs/oa-cflgt3.xml
new file mode 100644
index 00000000..9a39a493
--- /dev/null
+++ b/lib/i915/perf-configs/oa-cflgt3.xml
@@ -0,0 +1,10933 @@
+<?xml version="1.0"?>
+<metrics version="1562317148" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="b316bcab-212f-4228-97de-af6b5a1a2ea1"
+       chipset="CFLGT3"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ B 5 READ UADD 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C01E0" />
+        <register type="NOA" address="0x00009888" value="0x12170280" />
+        <register type="NOA" address="0x00009888" value="0x12370280" />
+        <register type="NOA" address="0x00009888" value="0x16EC01E0" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0380" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A1B4000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0001" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x042F1000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8400" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0002" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F6600" />
+        <register type="NOA" address="0x00009888" value="0x100F0001" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CA200" />
+        <register type="NOA" address="0x00009888" value="0x062D8000" />
+        <register type="NOA" address="0x00009888" value="0x082D8000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x08133000" />
+        <register type="NOA" address="0x00009888" value="0x00170020" />
+        <register type="NOA" address="0x00009888" value="0x08170021" />
+        <register type="NOA" address="0x00009888" value="0x10170000" />
+        <register type="NOA" address="0x00009888" value="0x0633C000" />
+        <register type="NOA" address="0x00009888" value="0x0833C000" />
+        <register type="NOA" address="0x00009888" value="0x06370800" />
+        <register type="NOA" address="0x00009888" value="0x08370840" />
+        <register type="NOA" address="0x00009888" value="0x10370000" />
+        <register type="NOA" address="0x00009888" value="0x1ACE0200" />
+        <register type="NOA" address="0x00009888" value="0x0AEC5300" />
+        <register type="NOA" address="0x00009888" value="0x10EC0000" />
+        <register type="NOA" address="0x00009888" value="0x1CEC0000" />
+        <register type="NOA" address="0x00009888" value="0x0A9B8000" />
+        <register type="NOA" address="0x00009888" value="0x1C9C0002" />
+        <register type="NOA" address="0x00009888" value="0x0CCC0002" />
+        <register type="NOA" address="0x00009888" value="0x0A8D8000" />
+        <register type="NOA" address="0x00009888" value="0x108F0001" />
+        <register type="NOA" address="0x00009888" value="0x16AC8000" />
+        <register type="NOA" address="0x00009888" value="0x0D933031" />
+        <register type="NOA" address="0x00009888" value="0x0F933E3F" />
+        <register type="NOA" address="0x00009888" value="0x01933D00" />
+        <register type="NOA" address="0x00009888" value="0x0393073C" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1D930000" />
+        <register type="NOA" address="0x00009888" value="0x19930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51902240" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x55900242" />
+        <register type="NOA" address="0x00009888" value="0x45900084" />
+        <register type="NOA" address="0x00009888" value="0x47901400" />
+        <register type="NOA" address="0x00009888" value="0x57902220" />
+        <register type="NOA" address="0x00009888" value="0x49900C60" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900002" />
+        <register type="NOA" address="0x00009888" value="0x43900C63" />
+        <register type="NOA" address="0x00009888" value="0x53902222" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="607f9cc8-e026-4d5f-bfad-45c77eabc150"
+       chipset="CFLGT3"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0820" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x064F0900" />
+        <register type="NOA" address="0x00009888" value="0x084F0032" />
+        <register type="NOA" address="0x00009888" value="0x0A4F1891" />
+        <register type="NOA" address="0x00009888" value="0x0C4F0E00" />
+        <register type="NOA" address="0x00009888" value="0x0E4F003C" />
+        <register type="NOA" address="0x00009888" value="0x004F0D80" />
+        <register type="NOA" address="0x00009888" value="0x024F003B" />
+        <register type="NOA" address="0x00009888" value="0x006C0002" />
+        <register type="NOA" address="0x00009888" value="0x086C0100" />
+        <register type="NOA" address="0x00009888" value="0x0C6C000C" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B00" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x081B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E1B8000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0024" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C6000" />
+        <register type="NOA" address="0x00009888" value="0x1C5C001B" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0208" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+        <register type="NOA" address="0x00009888" value="0x162CFB00" />
+        <register type="NOA" address="0x00009888" value="0x182C00BE" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x19900157" />
+        <register type="NOA" address="0x00009888" value="0x1B900158" />
+        <register type="NOA" address="0x00009888" value="0x1D900105" />
+        <register type="NOA" address="0x00009888" value="0x1F900103" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x11900FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900821" />
+        <register type="NOA" address="0x00009888" value="0x47900802" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900802" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900002" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900422" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="9875e050-b1bc-45e6-a6ab-665594601df9"
+       chipset="CFLGT3"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull stall pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x10116800" />
+        <register type="NOA" address="0x00009888" value="0x178A03E0" />
+        <register type="NOA" address="0x00009888" value="0x11824C00" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x13840020" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x01870C40" />
+        <register type="NOA" address="0x00009888" value="0x17880000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x040D4000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020E5400" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x080F0040" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06110012" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890100" />
+        <register type="NOA" address="0x00009888" value="0x03898000" />
+        <register type="NOA" address="0x00009888" value="0x09808000" />
+        <register type="NOA" address="0x00009888" value="0x0B808000" />
+        <register type="NOA" address="0x00009888" value="0x0380C000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+        <register type="NOA" address="0x00009888" value="0x138A8000" />
+        <register type="NOA" address="0x00009888" value="0x1D81A000" />
+        <register type="NOA" address="0x00009888" value="0x15818000" />
+        <register type="NOA" address="0x00009888" value="0x17818000" />
+        <register type="NOA" address="0x00009888" value="0x0B820030" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x05824000" />
+        <register type="NOA" address="0x00009888" value="0x0D830003" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x03838000" />
+        <register type="NOA" address="0x00009888" value="0x07838000" />
+        <register type="NOA" address="0x00009888" value="0x0B840980" />
+        <register type="NOA" address="0x00009888" value="0x03844D80" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x09850080" />
+        <register type="NOA" address="0x00009888" value="0x03850003" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x09870032" />
+        <register type="NOA" address="0x00009888" value="0x01888052" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x09884000" />
+        <register type="NOA" address="0x00009888" value="0x1B931001" />
+        <register type="NOA" address="0x00009888" value="0x1D930001" />
+        <register type="NOA" address="0x00009888" value="0x19934000" />
+        <register type="NOA" address="0x00009888" value="0x1B958000" />
+        <register type="NOA" address="0x00009888" value="0x1D950094" />
+        <register type="NOA" address="0x00009888" value="0x19958000" />
+        <register type="NOA" address="0x00009888" value="0x09E58000" />
+        <register type="NOA" address="0x00009888" value="0x0BE58000" />
+        <register type="NOA" address="0x00009888" value="0x03E5C000" />
+        <register type="NOA" address="0x00009888" value="0x0592C000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D924000" />
+        <register type="NOA" address="0x00009888" value="0x0F924000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x1392C000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x01985000" />
+        <register type="NOA" address="0x00009888" value="0x07988000" />
+        <register type="NOA" address="0x00009888" value="0x09981000" />
+        <register type="NOA" address="0x00009888" value="0x0B982000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x0F989000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1190C080" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900440" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900C21" />
+        <register type="NOA" address="0x00009888" value="0x57900400" />
+        <register type="NOA" address="0x00009888" value="0x49900042" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900024" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900841" />
+        <register type="NOA" address="0x00009888" value="0x53900400" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="49c65f34-e625-4ca4-86b7-88693e624d4c"
+       chipset="CFLGT3"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900064" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900150" />
+        <register type="NOA" address="0x00009888" value="0x21900151" />
+        <register type="NOA" address="0x00009888" value="0x23900152" />
+        <register type="NOA" address="0x00009888" value="0x25900153" />
+        <register type="NOA" address="0x00009888" value="0x27900154" />
+        <register type="NOA" address="0x00009888" value="0x29900155" />
+        <register type="NOA" address="0x00009888" value="0x2B900156" />
+        <register type="NOA" address="0x00009888" value="0x2D900157" />
+        <register type="NOA" address="0x00009888" value="0x2F90015F" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="45c9e8ee-2998-4d83-88e8-9cb7e03287bf"
+       chipset="CFLGT3"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900160" />
+        <register type="NOA" address="0x00009888" value="0x21900161" />
+        <register type="NOA" address="0x00009888" value="0x23900162" />
+        <register type="NOA" address="0x00009888" value="0x25900163" />
+        <register type="NOA" address="0x00009888" value="0x27900164" />
+        <register type="NOA" address="0x00009888" value="0x29900165" />
+        <register type="NOA" address="0x00009888" value="0x2B900166" />
+        <register type="NOA" address="0x00009888" value="0x2D900167" />
+        <register type="NOA" address="0x00009888" value="0x2F900150" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="bac415ce-d7a2-4f8d-9b16-834deba7330e"
+       chipset="CFLGT3"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C8160" />
+        <register type="NOA" address="0x00009888" value="0x161C8015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4EAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B01" />
+        <register type="NOA" address="0x00009888" value="0x006C0200" />
+        <register type="NOA" address="0x00009888" value="0x026C000C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0041" />
+        <register type="NOA" address="0x00009888" value="0x061C4200" />
+        <register type="NOA" address="0x00009888" value="0x081C4443" />
+        <register type="NOA" address="0x00009888" value="0x0A1C4645" />
+        <register type="NOA" address="0x00009888" value="0x0C1C7647" />
+        <register type="NOA" address="0x00009888" value="0x041C7357" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0000" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4CAA2A" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02AA" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5515" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x11907FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900802" />
+        <register type="NOA" address="0x00009888" value="0x47900842" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900842" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900800" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="a8cfca44-0e74-4338-9e57-3daad98957dd"
+       chipset="CFLGT3"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages send to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C0760" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E8020" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1CE000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2A00" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0280" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F1500" />
+        <register type="NOA" address="0x00009888" value="0x100F0140" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C00A0" />
+        <register type="NOA" address="0x00009888" value="0x03933300" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190030F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900021" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="c4bee67c-0de6-4bc2-9900-5388dcc8adca"
+       chipset="CFLGT3"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x106C0232" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F1880" />
+        <register type="NOA" address="0x00009888" value="0x024F08BB" />
+        <register type="NOA" address="0x00009888" value="0x044F001B" />
+        <register type="NOA" address="0x00009888" value="0x046C0100" />
+        <register type="NOA" address="0x00009888" value="0x066C000B" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x041B8000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025BC000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x165C8000" />
+        <register type="NOA" address="0x00009888" value="0x185C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00A0" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x062CC000" />
+        <register type="NOA" address="0x00009888" value="0x082CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x07830000" />
+        <register type="NOA" address="0x00009888" value="0x1D950080" />
+        <register type="NOA" address="0x00009888" value="0x13928000" />
+        <register type="NOA" address="0x00009888" value="0x0F988000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900040" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="2f77a650-54a6-4777-98dc-e49000c13ceb"
+       chipset="CFLGT3"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C7B40" />
+        <register type="NOA" address="0x00009888" value="0x166C0020" />
+        <register type="NOA" address="0x00009888" value="0x0A603444" />
+        <register type="NOA" address="0x00009888" value="0x0A613400" />
+        <register type="NOA" address="0x00009888" value="0x1A4EA800" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0800" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C003C" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x10600000" />
+        <register type="NOA" address="0x00009888" value="0x04600000" />
+        <register type="NOA" address="0x00009888" value="0x0C610044" />
+        <register type="NOA" address="0x00009888" value="0x10610000" />
+        <register type="NOA" address="0x00009888" value="0x06610000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02A8" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0154" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190FFC0" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900021" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900400" />
+        <register type="NOA" address="0x00009888" value="0x43900421" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="61cf6b31-9ddd-4deb-bae5-7339dd1f63b3"
+       chipset="CFLGT3"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C02E0" />
+        <register type="NOA" address="0x00009888" value="0x146C0001" />
+        <register type="NOA" address="0x00009888" value="0x0A623400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x026C3324" />
+        <register type="NOA" address="0x00009888" value="0x046C3422" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x06614000" />
+        <register type="NOA" address="0x00009888" value="0x0C620044" />
+        <register type="NOA" address="0x00009888" value="0x10620000" />
+        <register type="NOA" address="0x00009888" value="0x06620000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="1421ea8b-a4c9-4383-922a-60ba96c42f24"
+       chipset="CFLGT3"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C4E80" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A633400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x026C3321" />
+        <register type="NOA" address="0x00009888" value="0x046C342F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C2000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x06604000" />
+        <register type="NOA" address="0x00009888" value="0x0C630044" />
+        <register type="NOA" address="0x00009888" value="0x10630000" />
+        <register type="NOA" address="0x00009888" value="0x06630000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00AA" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="6e1f0a90-c65f-4da9-86d0-c79b3c0063f6"
+       chipset="CFLGT3"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x102F3800" />
+        <register type="NOA" address="0x00009888" value="0x144D0500" />
+        <register type="NOA" address="0x00009888" value="0x120D03C0" />
+        <register type="NOA" address="0x00009888" value="0x140D03CF" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0004" />
+        <register type="NOA" address="0x00009888" value="0x0C4E4000" />
+        <register type="NOA" address="0x00009888" value="0x042F0480" />
+        <register type="NOA" address="0x00009888" value="0x082F0000" />
+        <register type="NOA" address="0x00009888" value="0x022F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0090" />
+        <register type="NOA" address="0x00009888" value="0x064D0027" />
+        <register type="NOA" address="0x00009888" value="0x004D0000" />
+        <register type="NOA" address="0x00009888" value="0x000D0D40" />
+        <register type="NOA" address="0x00009888" value="0x020D803F" />
+        <register type="NOA" address="0x00009888" value="0x040D8023" />
+        <register type="NOA" address="0x00009888" value="0x100D0000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020F0010" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0050" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41901400" />
+        <register type="NOA" address="0x00009888" value="0x43901485" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="7cb05eab-0857-4189-93bc-09326d298637"
+       chipset="CFLGT3"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x14152C00" />
+        <register type="NOA" address="0x00009888" value="0x16150005" />
+        <register type="NOA" address="0x00009888" value="0x121600A0" />
+        <register type="NOA" address="0x00009888" value="0x14352C00" />
+        <register type="NOA" address="0x00009888" value="0x16350005" />
+        <register type="NOA" address="0x00009888" value="0x123600A0" />
+        <register type="NOA" address="0x00009888" value="0x14552C00" />
+        <register type="NOA" address="0x00009888" value="0x16550005" />
+        <register type="NOA" address="0x00009888" value="0x125600A0" />
+        <register type="NOA" address="0x00009888" value="0x062F6000" />
+        <register type="NOA" address="0x00009888" value="0x022F2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0050" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0350" />
+        <register type="NOA" address="0x00009888" value="0x0C0FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F00DA" />
+        <register type="NOA" address="0x00009888" value="0x182C0028" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x022DC000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C138000" />
+        <register type="NOA" address="0x00009888" value="0x0E132000" />
+        <register type="NOA" address="0x00009888" value="0x0413C000" />
+        <register type="NOA" address="0x00009888" value="0x1C140018" />
+        <register type="NOA" address="0x00009888" value="0x0C157000" />
+        <register type="NOA" address="0x00009888" value="0x0E150078" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04162180" />
+        <register type="NOA" address="0x00009888" value="0x02160000" />
+        <register type="NOA" address="0x00009888" value="0x04174000" />
+        <register type="NOA" address="0x00009888" value="0x0233A000" />
+        <register type="NOA" address="0x00009888" value="0x04333000" />
+        <register type="NOA" address="0x00009888" value="0x14348000" />
+        <register type="NOA" address="0x00009888" value="0x16348000" />
+        <register type="NOA" address="0x00009888" value="0x02357870" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04360043" />
+        <register type="NOA" address="0x00009888" value="0x02360000" />
+        <register type="NOA" address="0x00009888" value="0x04371000" />
+        <register type="NOA" address="0x00009888" value="0x0E538000" />
+        <register type="NOA" address="0x00009888" value="0x00538000" />
+        <register type="NOA" address="0x00009888" value="0x06533000" />
+        <register type="NOA" address="0x00009888" value="0x1C540020" />
+        <register type="NOA" address="0x00009888" value="0x12548000" />
+        <register type="NOA" address="0x00009888" value="0x0E557000" />
+        <register type="NOA" address="0x00009888" value="0x00557800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06560043" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x06571000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900060" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900060" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="05a06d02-0c12-486b-bb1d-9be053848980"
+       chipset="CFLGT3"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12120000" />
+        <register type="NOA" address="0x00009888" value="0x12320000" />
+        <register type="NOA" address="0x00009888" value="0x12520000" />
+        <register type="NOA" address="0x00009888" value="0x002F8000" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0015" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F03A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0FF000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0095" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x02108000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x02118000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x02121880" />
+        <register type="NOA" address="0x00009888" value="0x041219B5" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x02134000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x0C308000" />
+        <register type="NOA" address="0x00009888" value="0x0E304000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x0C318000" />
+        <register type="NOA" address="0x00009888" value="0x0E314000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x0C321A80" />
+        <register type="NOA" address="0x00009888" value="0x0E320033" />
+        <register type="NOA" address="0x00009888" value="0x06320031" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x0C334000" />
+        <register type="NOA" address="0x00009888" value="0x0E331000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0E508000" />
+        <register type="NOA" address="0x00009888" value="0x00508000" />
+        <register type="NOA" address="0x00009888" value="0x02504000" />
+        <register type="NOA" address="0x00009888" value="0x0E518000" />
+        <register type="NOA" address="0x00009888" value="0x00518000" />
+        <register type="NOA" address="0x00009888" value="0x02514000" />
+        <register type="NOA" address="0x00009888" value="0x0E521880" />
+        <register type="NOA" address="0x00009888" value="0x00521A80" />
+        <register type="NOA" address="0x00009888" value="0x02520033" />
+        <register type="NOA" address="0x00009888" value="0x0E534000" />
+        <register type="NOA" address="0x00009888" value="0x00534000" />
+        <register type="NOA" address="0x00009888" value="0x02531000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900062" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="cddbd1dc-41a2-4fe4-8b05-3d2773120814"
+       chipset="CFLGT3"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12124D60" />
+        <register type="NOA" address="0x00009888" value="0x12322E60" />
+        <register type="NOA" address="0x00009888" value="0x12524D60" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0014" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0FE000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0097" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x002D8000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x04121FB7" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x00308000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x00318000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x00321B80" />
+        <register type="NOA" address="0x00009888" value="0x0632003F" />
+        <register type="NOA" address="0x00009888" value="0x00334000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0250C000" />
+        <register type="NOA" address="0x00009888" value="0x0251C000" />
+        <register type="NOA" address="0x00009888" value="0x02521FB7" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x02535000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900063" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="e61ae394-9d9e-4204-a735-1dad7e44d953"
+       chipset="CFLGT3"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 5 READ C 6 READ FADD C 7 READ FADD C 2 READ FADD C 3 READ FADD C 4 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121203E0" />
+        <register type="NOA" address="0x00009888" value="0x123203E0" />
+        <register type="NOA" address="0x00009888" value="0x125203E0" />
+        <register type="NOA" address="0x00009888" value="0x129203E0" />
+        <register type="NOA" address="0x00009888" value="0x12B203E0" />
+        <register type="NOA" address="0x00009888" value="0x12D203E0" />
+        <register type="NOA" address="0x00009888" value="0x024EC000" />
+        <register type="NOA" address="0x00009888" value="0x044EC000" />
+        <register type="NOA" address="0x00009888" value="0x064EC000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0042" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F006D" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x042D8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06114000" />
+        <register type="NOA" address="0x00009888" value="0x06120033" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x04308000" />
+        <register type="NOA" address="0x00009888" value="0x04318000" />
+        <register type="NOA" address="0x00009888" value="0x04321980" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x04334000" />
+        <register type="NOA" address="0x00009888" value="0x04504000" />
+        <register type="NOA" address="0x00009888" value="0x04514000" />
+        <register type="NOA" address="0x00009888" value="0x04520033" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x04531000" />
+        <register type="NOA" address="0x00009888" value="0x00AF8000" />
+        <register type="NOA" address="0x00009888" value="0x0ACC0001" />
+        <register type="NOA" address="0x00009888" value="0x008D8000" />
+        <register type="NOA" address="0x00009888" value="0x028DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C8FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F0001" />
+        <register type="NOA" address="0x00009888" value="0x06AC8000" />
+        <register type="NOA" address="0x00009888" value="0x02AD4000" />
+        <register type="NOA" address="0x00009888" value="0x02908000" />
+        <register type="NOA" address="0x00009888" value="0x02918000" />
+        <register type="NOA" address="0x00009888" value="0x02921980" />
+        <register type="NOA" address="0x00009888" value="0x00920000" />
+        <register type="NOA" address="0x00009888" value="0x02934000" />
+        <register type="NOA" address="0x00009888" value="0x02B04000" />
+        <register type="NOA" address="0x00009888" value="0x02B14000" />
+        <register type="NOA" address="0x00009888" value="0x02B20033" />
+        <register type="NOA" address="0x00009888" value="0x00B20000" />
+        <register type="NOA" address="0x00009888" value="0x02B31000" />
+        <register type="NOA" address="0x00009888" value="0x00D08000" />
+        <register type="NOA" address="0x00009888" value="0x00D18000" />
+        <register type="NOA" address="0x00009888" value="0x00D21980" />
+        <register type="NOA" address="0x00009888" value="0x00D34000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900002" />
+        <register type="NOA" address="0x00009888" value="0x53900420" />
+        <register type="NOA" address="0x00009888" value="0x459000A1" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+  </set>
+
+  <set name="Media Vme Pipe Gen9"
+       mdapi_supported_apis="MEDIA IO BB"
+       underscore_name="vme_pipe"
+       hw_config_guid="94272ad9-45ee-4e34-b7a7-51546cd6405c"
+       chipset="CFLGT3"
+       symbol_name="VMEPipe"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VME Busy"
+             description="The percentage of time in which VME (IME or CRE) was actively processing data."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vme_busy"
+             units="percent"
+             symbol_name="VMEBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview System Batch Tier2"
+             mdapi_group="VME Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A5800" />
+        <register type="NOA" address="0x00009888" value="0x161A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12180240" />
+        <register type="NOA" address="0x00009888" value="0x14180002" />
+        <register type="NOA" address="0x00009888" value="0x149A5800" />
+        <register type="NOA" address="0x00009888" value="0x169A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12980240" />
+        <register type="NOA" address="0x00009888" value="0x14980002" />
+        <register type="NOA" address="0x00009888" value="0x1A4E3FC0" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x022F8000" />
+        <register type="NOA" address="0x00009888" value="0x042F3000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C9500" />
+        <register type="NOA" address="0x00009888" value="0x0C4C002A" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0015" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C000A" />
+        <register type="NOA" address="0x00009888" value="0x04193000" />
+        <register type="NOA" address="0x00009888" value="0x081A28C1" />
+        <register type="NOA" address="0x00009888" value="0x001A0000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x0613C000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x00172000" />
+        <register type="NOA" address="0x00009888" value="0x06178000" />
+        <register type="NOA" address="0x00009888" value="0x0817A000" />
+        <register type="NOA" address="0x00009888" value="0x00180037" />
+        <register type="NOA" address="0x00009888" value="0x06180940" />
+        <register type="NOA" address="0x00009888" value="0x08180000" />
+        <register type="NOA" address="0x00009888" value="0x02180000" />
+        <register type="NOA" address="0x00009888" value="0x04183000" />
+        <register type="NOA" address="0x00009888" value="0x04AFC000" />
+        <register type="NOA" address="0x00009888" value="0x06AF3000" />
+        <register type="NOA" address="0x00009888" value="0x0ACC4000" />
+        <register type="NOA" address="0x00009888" value="0x0CCC0015" />
+        <register type="NOA" address="0x00009888" value="0x0A8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F4000" />
+        <register type="NOA" address="0x00009888" value="0x108F0015" />
+        <register type="NOA" address="0x00009888" value="0x16ACA000" />
+        <register type="NOA" address="0x00009888" value="0x18AC000A" />
+        <register type="NOA" address="0x00009888" value="0x06993000" />
+        <register type="NOA" address="0x00009888" value="0x0C9A28C1" />
+        <register type="NOA" address="0x00009888" value="0x009A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A93F000" />
+        <register type="NOA" address="0x00009888" value="0x0C93F000" />
+        <register type="NOA" address="0x00009888" value="0x0A97A000" />
+        <register type="NOA" address="0x00009888" value="0x0C97A000" />
+        <register type="NOA" address="0x00009888" value="0x0A980977" />
+        <register type="NOA" address="0x00009888" value="0x08980000" />
+        <register type="NOA" address="0x00009888" value="0x04980000" />
+        <register type="NOA" address="0x00009888" value="0x06983000" />
+        <register type="NOA" address="0x00009888" value="0x119000FF" />
+        <register type="NOA" address="0x00009888" value="0x51900040" />
+        <register type="NOA" address="0x00009888" value="0x41900020" />
+        <register type="NOA" address="0x00009888" value="0x55900004" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x479008A5" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900002" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00100030" />
+        <register type="OA" address="0x00002774" value="0x0000FFF9" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFF3" />
+        <register type="OA" address="0x00002788" value="0x00100180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="22b7e0c2-cade-425f-b099-34479768c72a"
+       chipset="CFLGT3"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox1 Ring Busy"
+             description="The percentage of time when Vdbox1 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox1_busy"
+             units="percent"
+             symbol_name="Vdbox1Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x19D05800" />
+        <register type="NOA" address="0x00009888" value="0x13805800" />
+        <register type="NOA" address="0x00009888" value="0x05962C25" />
+        <register type="NOA" address="0x00009888" value="0x19950016" />
+        <register type="NOA" address="0x00009888" value="0x19C05800" />
+        <register type="NOA" address="0x00009888" value="0x05D00085" />
+        <register type="NOA" address="0x00009888" value="0x25D00000" />
+        <register type="NOA" address="0x00009888" value="0x09D54000" />
+        <register type="NOA" address="0x00009888" value="0x07800035" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x1D810400" />
+        <register type="NOA" address="0x00009888" value="0x21960000" />
+        <register type="NOA" address="0x00009888" value="0x0996C000" />
+        <register type="NOA" address="0x00009888" value="0x0B964000" />
+        <register type="NOA" address="0x00009888" value="0x19938000" />
+        <register type="NOA" address="0x00009888" value="0x1B930068" />
+        <register type="NOA" address="0x00009888" value="0x15948000" />
+        <register type="NOA" address="0x00009888" value="0x1B94000C" />
+        <register type="NOA" address="0x00009888" value="0x03957500" />
+        <register type="NOA" address="0x00009888" value="0x1D950000" />
+        <register type="NOA" address="0x00009888" value="0x17950000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x07928000" />
+        <register type="NOA" address="0x00009888" value="0x03988000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x09978000" />
+        <register type="NOA" address="0x00009888" value="0x05C08500" />
+        <register type="NOA" address="0x00009888" value="0x25C00000" />
+        <register type="NOA" address="0x00009888" value="0x1BC00000" />
+        <register type="NOA" address="0x00009888" value="0x0BC54000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900463" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0007C000" />
+        <register type="OA" address="0x00002774" value="0x000007FF" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="577e8e2c-3fa0-4875-8743-3538d585e3b0"
+       chipset="CFLGT3"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810000" />
+        <register type="NOA" address="0x00009888" value="0x07810013" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930040" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="c11af8d1-858b-4f8b-98fb-8d683ba8bda0"
+       chipset="CFLGT3"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x122D3080" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E0FAA00" />
+        <register type="NOA" address="0x00009888" value="0x100F0002" />
+        <register type="NOA" address="0x00009888" value="0x002D0025" />
+        <register type="NOA" address="0x00009888" value="0x062D1300" />
+        <register type="NOA" address="0x00009888" value="0x082D16A4" />
+        <register type="NOA" address="0x00009888" value="0x0A2D162E" />
+        <register type="NOA" address="0x00009888" value="0x102D0000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-chv.xml b/lib/i915/perf-configs/oa-chv.xml
new file mode 100644
index 00000000..dfc67b96
--- /dev/null
+++ b/lib/i915/perf-configs/oa-chv.xml
@@ -0,0 +1,9757 @@
+<?xml version="1.0"?>
+<metrics version="1562317147" merge_md5="">
+  <set name="Render Metrics Basic Gen8LP"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="9d8a3af5-c02c-4a4a-b947-f1672469e0fb"
+       chipset="CHV"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ  B 1 READ UADD $GpuCoreClocks FDIV 2 FDIV 100 FMUL"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x59800000" />
+        <register type="NOA" address="0x00009888" value="0x59800001" />
+        <register type="NOA" address="0x00009888" value="0x285A0006" />
+        <register type="NOA" address="0x00009888" value="0x2C110014" />
+        <register type="NOA" address="0x00009888" value="0x2E110000" />
+        <register type="NOA" address="0x00009888" value="0x2C310014" />
+        <register type="NOA" address="0x00009888" value="0x2E310000" />
+        <register type="NOA" address="0x00009888" value="0x2B8303DF" />
+        <register type="NOA" address="0x00009888" value="0x3580024F" />
+        <register type="NOA" address="0x00009888" value="0x00580888" />
+        <register type="NOA" address="0x00009888" value="0x1E5A0015" />
+        <register type="NOA" address="0x00009888" value="0x205A0014" />
+        <register type="NOA" address="0x00009888" value="0x045A0000" />
+        <register type="NOA" address="0x00009888" value="0x025A0000" />
+        <register type="NOA" address="0x00009888" value="0x02180500" />
+        <register type="NOA" address="0x00009888" value="0x00190555" />
+        <register type="NOA" address="0x00009888" value="0x021D0500" />
+        <register type="NOA" address="0x00009888" value="0x021F0A00" />
+        <register type="NOA" address="0x00009888" value="0x00380444" />
+        <register type="NOA" address="0x00009888" value="0x02390500" />
+        <register type="NOA" address="0x00009888" value="0x003A0666" />
+        <register type="NOA" address="0x00009888" value="0x00100111" />
+        <register type="NOA" address="0x00009888" value="0x06110030" />
+        <register type="NOA" address="0x00009888" value="0x0A110031" />
+        <register type="NOA" address="0x00009888" value="0x0E110046" />
+        <register type="NOA" address="0x00009888" value="0x04110000" />
+        <register type="NOA" address="0x00009888" value="0x00110000" />
+        <register type="NOA" address="0x00009888" value="0x00130111" />
+        <register type="NOA" address="0x00009888" value="0x00300444" />
+        <register type="NOA" address="0x00009888" value="0x08310030" />
+        <register type="NOA" address="0x00009888" value="0x0C310031" />
+        <register type="NOA" address="0x00009888" value="0x10310046" />
+        <register type="NOA" address="0x00009888" value="0x04310000" />
+        <register type="NOA" address="0x00009888" value="0x00310000" />
+        <register type="NOA" address="0x00009888" value="0x00330444" />
+        <register type="NOA" address="0x00009888" value="0x038A0A00" />
+        <register type="NOA" address="0x00009888" value="0x018B0FFF" />
+        <register type="NOA" address="0x00009888" value="0x038B0A00" />
+        <register type="NOA" address="0x00009888" value="0x01855000" />
+        <register type="NOA" address="0x00009888" value="0x03850055" />
+        <register type="NOA" address="0x00009888" value="0x13830021" />
+        <register type="NOA" address="0x00009888" value="0x15830020" />
+        <register type="NOA" address="0x00009888" value="0x1783002F" />
+        <register type="NOA" address="0x00009888" value="0x1983002E" />
+        <register type="NOA" address="0x00009888" value="0x1B83002D" />
+        <register type="NOA" address="0x00009888" value="0x1D83002C" />
+        <register type="NOA" address="0x00009888" value="0x05830000" />
+        <register type="NOA" address="0x00009888" value="0x01840555" />
+        <register type="NOA" address="0x00009888" value="0x03840500" />
+        <register type="NOA" address="0x00009888" value="0x23800074" />
+        <register type="NOA" address="0x00009888" value="0x2580007D" />
+        <register type="NOA" address="0x00009888" value="0x05800000" />
+        <register type="NOA" address="0x00009888" value="0x01805000" />
+        <register type="NOA" address="0x00009888" value="0x03800055" />
+        <register type="NOA" address="0x00009888" value="0x01865000" />
+        <register type="NOA" address="0x00009888" value="0x03860055" />
+        <register type="NOA" address="0x00009888" value="0x01875000" />
+        <register type="NOA" address="0x00009888" value="0x03870055" />
+        <register type="NOA" address="0x00009888" value="0x418000AA" />
+        <register type="NOA" address="0x00009888" value="0x4380000A" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x4780000A" />
+        <register type="NOA" address="0x00009888" value="0x49800000" />
+        <register type="NOA" address="0x00009888" value="0x4B800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x55800000" />
+        <register type="NOA" address="0x00009888" value="0x57800000" />
+        <register type="NOA" address="0x00009888" value="0x59800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen8LP"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="f522a89c-ecd1-4522-8331-3383c54af5f5"
+       chipset="CHV"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 4 READ B 5 READ UADD 64 UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 2 READ B 3 READ UADD 64 UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 0 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Ring Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and Uncore ring."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 128 UMUL"
+             equation="C 2 READ 128 UMUL"
+             underscore_name="gti_ring_throughput"
+             units="bytes"
+             symbol_name="GtiRingThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 0 READ B 1 READ UADD 64 UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read-Only Stall"
+             description="The percentage of time in which GTI Read-Only port has been stalled."
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gti_ro_stall"
+             units="percent"
+             symbol_name="GtiRoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read-Write Stall"
+             description="The percentage of time in which GTI Read-Write port has been stalled."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gti_rw_stall"
+             units="percent"
+             symbol_name="GtiRwStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 1 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x59800000" />
+        <register type="NOA" address="0x00009888" value="0x59800001" />
+        <register type="NOA" address="0x00009888" value="0x2E5800E0" />
+        <register type="NOA" address="0x00009888" value="0x2E3800E0" />
+        <register type="NOA" address="0x00009888" value="0x3580024F" />
+        <register type="NOA" address="0x00009888" value="0x3D800140" />
+        <register type="NOA" address="0x00009888" value="0x08580042" />
+        <register type="NOA" address="0x00009888" value="0x0C580040" />
+        <register type="NOA" address="0x00009888" value="0x1058004C" />
+        <register type="NOA" address="0x00009888" value="0x1458004B" />
+        <register type="NOA" address="0x00009888" value="0x04580000" />
+        <register type="NOA" address="0x00009888" value="0x00580000" />
+        <register type="NOA" address="0x00009888" value="0x00195555" />
+        <register type="NOA" address="0x00009888" value="0x06380042" />
+        <register type="NOA" address="0x00009888" value="0x0A380040" />
+        <register type="NOA" address="0x00009888" value="0x0E38004C" />
+        <register type="NOA" address="0x00009888" value="0x1238004B" />
+        <register type="NOA" address="0x00009888" value="0x04380000" />
+        <register type="NOA" address="0x00009888" value="0x00384444" />
+        <register type="NOA" address="0x00009888" value="0x003A5555" />
+        <register type="NOA" address="0x00009888" value="0x018BFFFF" />
+        <register type="NOA" address="0x00009888" value="0x01845555" />
+        <register type="NOA" address="0x00009888" value="0x17800074" />
+        <register type="NOA" address="0x00009888" value="0x1980007D" />
+        <register type="NOA" address="0x00009888" value="0x1B80007C" />
+        <register type="NOA" address="0x00009888" value="0x1D8000B6" />
+        <register type="NOA" address="0x00009888" value="0x1F8000B7" />
+        <register type="NOA" address="0x00009888" value="0x05800000" />
+        <register type="NOA" address="0x00009888" value="0x03800000" />
+        <register type="NOA" address="0x00009888" value="0x418000AA" />
+        <register type="NOA" address="0x00009888" value="0x438000AA" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x47800000" />
+        <register type="NOA" address="0x00009888" value="0x4980012A" />
+        <register type="NOA" address="0x00009888" value="0x4B80012A" />
+        <register type="NOA" address="0x00009888" value="0x4D80012A" />
+        <register type="NOA" address="0x00009888" value="0x4F80012A" />
+        <register type="NOA" address="0x00009888" value="0x518001CE" />
+        <register type="NOA" address="0x00009888" value="0x538001CE" />
+        <register type="NOA" address="0x00009888" value="0x5580000E" />
+        <register type="NOA" address="0x00009888" value="0x59800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="a9ccc03d-a943-4e6b-9cd6-13e063075927"
+       chipset="CHV"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull stall pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages send to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses UADD UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x59800000" />
+        <register type="NOA" address="0x00009888" value="0x59800001" />
+        <register type="NOA" address="0x00009888" value="0x261E0000" />
+        <register type="NOA" address="0x00009888" value="0x281F000F" />
+        <register type="NOA" address="0x00009888" value="0x2817001A" />
+        <register type="NOA" address="0x00009888" value="0x2791001F" />
+        <register type="NOA" address="0x00009888" value="0x27880019" />
+        <register type="NOA" address="0x00009888" value="0x2D890000" />
+        <register type="NOA" address="0x00009888" value="0x278A0007" />
+        <register type="NOA" address="0x00009888" value="0x298D001F" />
+        <register type="NOA" address="0x00009888" value="0x278E0020" />
+        <register type="NOA" address="0x00009888" value="0x2B8F0012" />
+        <register type="NOA" address="0x00009888" value="0x29900000" />
+        <register type="NOA" address="0x00009888" value="0x00184000" />
+        <register type="NOA" address="0x00009888" value="0x02181000" />
+        <register type="NOA" address="0x00009888" value="0x02194000" />
+        <register type="NOA" address="0x00009888" value="0x141E0002" />
+        <register type="NOA" address="0x00009888" value="0x041E0000" />
+        <register type="NOA" address="0x00009888" value="0x001E0000" />
+        <register type="NOA" address="0x00009888" value="0x221F0015" />
+        <register type="NOA" address="0x00009888" value="0x041F0000" />
+        <register type="NOA" address="0x00009888" value="0x001F4000" />
+        <register type="NOA" address="0x00009888" value="0x021F0000" />
+        <register type="NOA" address="0x00009888" value="0x023A8000" />
+        <register type="NOA" address="0x00009888" value="0x0213C000" />
+        <register type="NOA" address="0x00009888" value="0x02164000" />
+        <register type="NOA" address="0x00009888" value="0x24170012" />
+        <register type="NOA" address="0x00009888" value="0x04170000" />
+        <register type="NOA" address="0x00009888" value="0x07910005" />
+        <register type="NOA" address="0x00009888" value="0x05910000" />
+        <register type="NOA" address="0x00009888" value="0x01911500" />
+        <register type="NOA" address="0x00009888" value="0x03910501" />
+        <register type="NOA" address="0x00009888" value="0x0D880002" />
+        <register type="NOA" address="0x00009888" value="0x1D880003" />
+        <register type="NOA" address="0x00009888" value="0x05880000" />
+        <register type="NOA" address="0x00009888" value="0x0B890032" />
+        <register type="NOA" address="0x00009888" value="0x1B890031" />
+        <register type="NOA" address="0x00009888" value="0x05890000" />
+        <register type="NOA" address="0x00009888" value="0x01890040" />
+        <register type="NOA" address="0x00009888" value="0x03890040" />
+        <register type="NOA" address="0x00009888" value="0x098A0000" />
+        <register type="NOA" address="0x00009888" value="0x198A0004" />
+        <register type="NOA" address="0x00009888" value="0x058A0000" />
+        <register type="NOA" address="0x00009888" value="0x018A8050" />
+        <register type="NOA" address="0x00009888" value="0x038A2050" />
+        <register type="NOA" address="0x00009888" value="0x018B95A9" />
+        <register type="NOA" address="0x00009888" value="0x038BE5A9" />
+        <register type="NOA" address="0x00009888" value="0x018C1500" />
+        <register type="NOA" address="0x00009888" value="0x038C0501" />
+        <register type="NOA" address="0x00009888" value="0x178D0015" />
+        <register type="NOA" address="0x00009888" value="0x058D0000" />
+        <register type="NOA" address="0x00009888" value="0x138E0004" />
+        <register type="NOA" address="0x00009888" value="0x218E000C" />
+        <register type="NOA" address="0x00009888" value="0x058E0000" />
+        <register type="NOA" address="0x00009888" value="0x018E0500" />
+        <register type="NOA" address="0x00009888" value="0x038E0101" />
+        <register type="NOA" address="0x00009888" value="0x0F8F0027" />
+        <register type="NOA" address="0x00009888" value="0x058F0000" />
+        <register type="NOA" address="0x00009888" value="0x018F0000" />
+        <register type="NOA" address="0x00009888" value="0x038F0001" />
+        <register type="NOA" address="0x00009888" value="0x11900013" />
+        <register type="NOA" address="0x00009888" value="0x1F900017" />
+        <register type="NOA" address="0x00009888" value="0x05900000" />
+        <register type="NOA" address="0x00009888" value="0x01900100" />
+        <register type="NOA" address="0x00009888" value="0x03900001" />
+        <register type="NOA" address="0x00009888" value="0x01845555" />
+        <register type="NOA" address="0x00009888" value="0x03845555" />
+        <register type="NOA" address="0x00009888" value="0x418000AA" />
+        <register type="NOA" address="0x00009888" value="0x438000AA" />
+        <register type="NOA" address="0x00009888" value="0x458000AA" />
+        <register type="NOA" address="0x00009888" value="0x478000AA" />
+        <register type="NOA" address="0x00009888" value="0x4980018C" />
+        <register type="NOA" address="0x00009888" value="0x4B80014B" />
+        <register type="NOA" address="0x00009888" value="0x4D800128" />
+        <register type="NOA" address="0x00009888" value="0x4F80012A" />
+        <register type="NOA" address="0x00009888" value="0x51800187" />
+        <register type="NOA" address="0x00009888" value="0x5380014B" />
+        <register type="NOA" address="0x00009888" value="0x55800149" />
+        <register type="NOA" address="0x00009888" value="0x5780010A" />
+        <register type="NOA" address="0x00009888" value="0x59800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="33af8252-7a51-4aa3-b0ba-1b946f209d7b"
+       chipset="CHV"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ C 0 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader12_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader12AccessStalledOnL3"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ B 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader10_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader10AccessStalledOnL3"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ B 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader11_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader11AccessStalledOnL3"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x105C0232" />
+        <register type="NOA" address="0x00009888" value="0x10580232" />
+        <register type="NOA" address="0x00009888" value="0x10380232" />
+        <register type="NOA" address="0x00009888" value="0x10DC0232" />
+        <register type="NOA" address="0x00009888" value="0x10D80232" />
+        <register type="NOA" address="0x00009888" value="0x10B80232" />
+        <register type="NOA" address="0x00009888" value="0x118E4400" />
+        <register type="NOA" address="0x00009888" value="0x025C6080" />
+        <register type="NOA" address="0x00009888" value="0x045C004B" />
+        <register type="NOA" address="0x00009888" value="0x005C8000" />
+        <register type="NOA" address="0x00009888" value="0x00582080" />
+        <register type="NOA" address="0x00009888" value="0x0258004B" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00AA" />
+        <register type="NOA" address="0x00009888" value="0x04386080" />
+        <register type="NOA" address="0x00009888" value="0x0638404B" />
+        <register type="NOA" address="0x00009888" value="0x02384000" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A380000" />
+        <register type="NOA" address="0x00009888" value="0x0C380000" />
+        <register type="NOA" address="0x00009888" value="0x00398000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x0CDC25C1" />
+        <register type="NOA" address="0x00009888" value="0x0ADCC000" />
+        <register type="NOA" address="0x00009888" value="0x0AD825C1" />
+        <register type="NOA" address="0x00009888" value="0x18DB4000" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0001" />
+        <register type="NOA" address="0x00009888" value="0x0E9F8000" />
+        <register type="NOA" address="0x00009888" value="0x109F02AA" />
+        <register type="NOA" address="0x00009888" value="0x0EB825C1" />
+        <register type="NOA" address="0x00009888" value="0x18B80154" />
+        <register type="NOA" address="0x00009888" value="0x0AB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0CB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0D88C000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258BAA05" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x198C5400" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x098DC000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x098E05C0" />
+        <register type="NOA" address="0x00009888" value="0x058E0000" />
+        <register type="NOA" address="0x00009888" value="0x198F0020" />
+        <register type="NOA" address="0x00009888" value="0x2185AA0A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x19835000" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x19808000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x51800040" />
+        <register type="NOA" address="0x00009888" value="0x43800400" />
+        <register type="NOA" address="0x00009888" value="0x45800800" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800C62" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F801042" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x418014A4" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FFF7" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="78f52900-5317-4417-8067-966fbf215a1f"
+       chipset="CHV"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank1 Stalled"
+             description="The percentage of time in which slice1 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank1_stalled"
+             units="percent"
+             symbol_name="L31Bank1Stalled"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice1 L3 Bank0 Stalled"
+             description="The percentage of time in which slice1 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank0_stalled"
+             units="percent"
+             symbol_name="L31Bank0Stalled"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice1 L3 Bank1 Active"
+             description="The percentage of time in which slice1 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank1_active"
+             units="percent"
+             symbol_name="L31Bank1Active"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank0 Active"
+             description="The percentage of time in which slice1 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank0_active"
+             units="percent"
+             symbol_name="L31Bank0Active"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x10BF03DA" />
+        <register type="NOA" address="0x00009888" value="0x14BF0001" />
+        <register type="NOA" address="0x00009888" value="0x12980340" />
+        <register type="NOA" address="0x00009888" value="0x12990340" />
+        <register type="NOA" address="0x00009888" value="0x0CBF1187" />
+        <register type="NOA" address="0x00009888" value="0x0EBF1205" />
+        <register type="NOA" address="0x00009888" value="0x00BF0500" />
+        <register type="NOA" address="0x00009888" value="0x02BF042B" />
+        <register type="NOA" address="0x00009888" value="0x04BF002C" />
+        <register type="NOA" address="0x00009888" value="0x0CDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDAC000" />
+        <register type="NOA" address="0x00009888" value="0x00DA8000" />
+        <register type="NOA" address="0x00009888" value="0x02DAC000" />
+        <register type="NOA" address="0x00009888" value="0x04DA4000" />
+        <register type="NOA" address="0x00009888" value="0x04983400" />
+        <register type="NOA" address="0x00009888" value="0x10980000" />
+        <register type="NOA" address="0x00009888" value="0x06990034" />
+        <register type="NOA" address="0x00009888" value="0x10990000" />
+        <register type="NOA" address="0x00009888" value="0x0C9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E9DC000" />
+        <register type="NOA" address="0x00009888" value="0x009D8000" />
+        <register type="NOA" address="0x00009888" value="0x029DC000" />
+        <register type="NOA" address="0x00009888" value="0x049D4000" />
+        <register type="NOA" address="0x00009888" value="0x109F02A8" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F00BA" />
+        <register type="NOA" address="0x00009888" value="0x0CB88000" />
+        <register type="NOA" address="0x00009888" value="0x0CB95000" />
+        <register type="NOA" address="0x00009888" value="0x0EB95000" />
+        <register type="NOA" address="0x00009888" value="0x00B94000" />
+        <register type="NOA" address="0x00009888" value="0x02B95000" />
+        <register type="NOA" address="0x00009888" value="0x04B91000" />
+        <register type="NOA" address="0x00009888" value="0x06B92000" />
+        <register type="NOA" address="0x00009888" value="0x0CBA4000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x258B800A" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B5500" />
+        <register type="NOA" address="0x00009888" value="0x198C4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x018D8000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2185800A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x1B830154" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x47800000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800060" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="0db4fe4a-2648-4064-bd6a-89c06d0c27b3"
+       chipset="CHV"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x103F03DA" />
+        <register type="NOA" address="0x00009888" value="0x143F0001" />
+        <register type="NOA" address="0x00009888" value="0x12180340" />
+        <register type="NOA" address="0x00009888" value="0x12190340" />
+        <register type="NOA" address="0x00009888" value="0x0C3F1187" />
+        <register type="NOA" address="0x00009888" value="0x0E3F1205" />
+        <register type="NOA" address="0x00009888" value="0x003F0500" />
+        <register type="NOA" address="0x00009888" value="0x023F042B" />
+        <register type="NOA" address="0x00009888" value="0x043F002C" />
+        <register type="NOA" address="0x00009888" value="0x0C5AC000" />
+        <register type="NOA" address="0x00009888" value="0x0E5AC000" />
+        <register type="NOA" address="0x00009888" value="0x005A8000" />
+        <register type="NOA" address="0x00009888" value="0x025AC000" />
+        <register type="NOA" address="0x00009888" value="0x045A4000" />
+        <register type="NOA" address="0x00009888" value="0x04183400" />
+        <register type="NOA" address="0x00009888" value="0x10180000" />
+        <register type="NOA" address="0x00009888" value="0x06190034" />
+        <register type="NOA" address="0x00009888" value="0x10190000" />
+        <register type="NOA" address="0x00009888" value="0x0C1DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1DC000" />
+        <register type="NOA" address="0x00009888" value="0x001D8000" />
+        <register type="NOA" address="0x00009888" value="0x021DC000" />
+        <register type="NOA" address="0x00009888" value="0x041D4000" />
+        <register type="NOA" address="0x00009888" value="0x101F02A8" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00BA" />
+        <register type="NOA" address="0x00009888" value="0x0C388000" />
+        <register type="NOA" address="0x00009888" value="0x0C395000" />
+        <register type="NOA" address="0x00009888" value="0x0E395000" />
+        <register type="NOA" address="0x00009888" value="0x00394000" />
+        <register type="NOA" address="0x00009888" value="0x02395000" />
+        <register type="NOA" address="0x00009888" value="0x04391000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AA800" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258B4005" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x2185800A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x1B830154" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x45800000" />
+        <register type="NOA" address="0x00009888" value="0x47800000" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800060" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="0de6539e-33b4-4aee-83c4-9ab45a579b94"
+       chipset="CHV"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank3 Active"
+             description="The percentage of time in which slice1 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank3_active"
+             units="percent"
+             symbol_name="L31Bank3Active"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice1 L3 Bank3 Stalled"
+             description="The percentage of time in which slice1 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank3_stalled"
+             units="percent"
+             symbol_name="L31Bank3Stalled"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x121B0340" />
+        <register type="NOA" address="0x00009888" value="0x103F0274" />
+        <register type="NOA" address="0x00009888" value="0x123F0000" />
+        <register type="NOA" address="0x00009888" value="0x129B0340" />
+        <register type="NOA" address="0x00009888" value="0x10BF0274" />
+        <register type="NOA" address="0x00009888" value="0x12BF0000" />
+        <register type="NOA" address="0x00009888" value="0x041B3400" />
+        <register type="NOA" address="0x00009888" value="0x101B0000" />
+        <register type="NOA" address="0x00009888" value="0x045C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A3D4000" />
+        <register type="NOA" address="0x00009888" value="0x003F0080" />
+        <register type="NOA" address="0x00009888" value="0x023F0793" />
+        <register type="NOA" address="0x00009888" value="0x043F0014" />
+        <register type="NOA" address="0x00009888" value="0x04588000" />
+        <register type="NOA" address="0x00009888" value="0x005A8000" />
+        <register type="NOA" address="0x00009888" value="0x025AC000" />
+        <register type="NOA" address="0x00009888" value="0x045A4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B4000" />
+        <register type="NOA" address="0x00009888" value="0x001D8000" />
+        <register type="NOA" address="0x00009888" value="0x021DC000" />
+        <register type="NOA" address="0x00009888" value="0x041D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F002A" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x00394000" />
+        <register type="NOA" address="0x00009888" value="0x02395000" />
+        <register type="NOA" address="0x00009888" value="0x04399000" />
+        <register type="NOA" address="0x00009888" value="0x069B0034" />
+        <register type="NOA" address="0x00009888" value="0x109B0000" />
+        <register type="NOA" address="0x00009888" value="0x06DC4000" />
+        <register type="NOA" address="0x00009888" value="0x0CBD4000" />
+        <register type="NOA" address="0x00009888" value="0x0CBF0981" />
+        <register type="NOA" address="0x00009888" value="0x0EBF0A0F" />
+        <register type="NOA" address="0x00009888" value="0x06D84000" />
+        <register type="NOA" address="0x00009888" value="0x0CDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0CDB4000" />
+        <register type="NOA" address="0x00009888" value="0x0C9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E9DC000" />
+        <register type="NOA" address="0x00009888" value="0x109F02A8" />
+        <register type="NOA" address="0x00009888" value="0x0E9F0080" />
+        <register type="NOA" address="0x00009888" value="0x0CB84000" />
+        <register type="NOA" address="0x00009888" value="0x0CB95000" />
+        <register type="NOA" address="0x00009888" value="0x0EB95000" />
+        <register type="NOA" address="0x00009888" value="0x06B92000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258B8009" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x198C4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2185800A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x1B830154" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x45800C00" />
+        <register type="NOA" address="0x00009888" value="0x47800C63" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F8014A5" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800045" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_4"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_4"
+       hw_config_guid="be74c9d6-268f-4d7f-b2e8-8d91d4441883"
+       chipset="CHV"
+       symbol_name="L3_4"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank2 Active"
+             description="The percentage of time in which slice1 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank2_active"
+             units="percent"
+             symbol_name="L31Bank2Active"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice1 L3 Bank2 Stalled"
+             description="The percentage of time in which slice1 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank2_stalled"
+             units="percent"
+             symbol_name="L31Bank2Stalled"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x121A0340" />
+        <register type="NOA" address="0x00009888" value="0x103F0017" />
+        <register type="NOA" address="0x00009888" value="0x123F0020" />
+        <register type="NOA" address="0x00009888" value="0x129A0340" />
+        <register type="NOA" address="0x00009888" value="0x10BF0017" />
+        <register type="NOA" address="0x00009888" value="0x12BF0020" />
+        <register type="NOA" address="0x00009888" value="0x041A3400" />
+        <register type="NOA" address="0x00009888" value="0x101A0000" />
+        <register type="NOA" address="0x00009888" value="0x043B8000" />
+        <register type="NOA" address="0x00009888" value="0x0A3E0010" />
+        <register type="NOA" address="0x00009888" value="0x003F0200" />
+        <register type="NOA" address="0x00009888" value="0x023F0113" />
+        <register type="NOA" address="0x00009888" value="0x043F0014" />
+        <register type="NOA" address="0x00009888" value="0x02592000" />
+        <register type="NOA" address="0x00009888" value="0x005A8000" />
+        <register type="NOA" address="0x00009888" value="0x025AC000" />
+        <register type="NOA" address="0x00009888" value="0x045A4000" />
+        <register type="NOA" address="0x00009888" value="0x0A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x001D8000" />
+        <register type="NOA" address="0x00009888" value="0x021DC000" />
+        <register type="NOA" address="0x00009888" value="0x041D4000" />
+        <register type="NOA" address="0x00009888" value="0x0A1E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F001A" />
+        <register type="NOA" address="0x00009888" value="0x00394000" />
+        <register type="NOA" address="0x00009888" value="0x02395000" />
+        <register type="NOA" address="0x00009888" value="0x04391000" />
+        <register type="NOA" address="0x00009888" value="0x069A0034" />
+        <register type="NOA" address="0x00009888" value="0x109A0000" />
+        <register type="NOA" address="0x00009888" value="0x06BB4000" />
+        <register type="NOA" address="0x00009888" value="0x0ABE0040" />
+        <register type="NOA" address="0x00009888" value="0x0CBF0984" />
+        <register type="NOA" address="0x00009888" value="0x0EBF0A02" />
+        <register type="NOA" address="0x00009888" value="0x02D94000" />
+        <register type="NOA" address="0x00009888" value="0x0CDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDAC000" />
+        <register type="NOA" address="0x00009888" value="0x0C9C0400" />
+        <register type="NOA" address="0x00009888" value="0x0C9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0E9DC000" />
+        <register type="NOA" address="0x00009888" value="0x0C9E0400" />
+        <register type="NOA" address="0x00009888" value="0x109F02A8" />
+        <register type="NOA" address="0x00009888" value="0x0E9F0040" />
+        <register type="NOA" address="0x00009888" value="0x0CB95000" />
+        <register type="NOA" address="0x00009888" value="0x0EB95000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258B8009" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x198C4000" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2185800A" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x1B830154" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x45800800" />
+        <register type="NOA" address="0x00009888" value="0x47800842" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F801084" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800044" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="31bc1ff3-8d09-4497-9d79-59c4f943b502"
+       chipset="CHV"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Rasterizer Input Available"
+             description="The percentage of time in which slice1 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer1_input_available"
+             units="percent"
+             symbol_name="Rasterizer1InputAvailable"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied))"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Pixel Values Ready"
+             description="The percentage of time in which slice1 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values1_ready"
+             units="percent"
+             symbol_name="PixelValues1Ready"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice1 PS Output Available"
+             description="The percentage of time in which slice1 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output1_available"
+             units="percent"
+             symbol_name="PSOutput1Available"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice1 Rasterizer Output Ready"
+             description="The percentage of time in which slice1 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer1_output_ready"
+             units="percent"
+             symbol_name="Rasterizer1OutputReady"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice1 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice1 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data1_ready"
+             units="percent"
+             symbol_name="PixelData1Ready"
+             availability="$SliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x143B000E" />
+        <register type="NOA" address="0x00009888" value="0x043C55C0" />
+        <register type="NOA" address="0x00009888" value="0x0A1E0280" />
+        <register type="NOA" address="0x00009888" value="0x0C1E0408" />
+        <register type="NOA" address="0x00009888" value="0x10390000" />
+        <register type="NOA" address="0x00009888" value="0x12397A1F" />
+        <register type="NOA" address="0x00009888" value="0x14BB000E" />
+        <register type="NOA" address="0x00009888" value="0x04BC5000" />
+        <register type="NOA" address="0x00009888" value="0x0A9E0296" />
+        <register type="NOA" address="0x00009888" value="0x0C9E0008" />
+        <register type="NOA" address="0x00009888" value="0x10B90000" />
+        <register type="NOA" address="0x00009888" value="0x12B97A1F" />
+        <register type="NOA" address="0x00009888" value="0x063B0042" />
+        <register type="NOA" address="0x00009888" value="0x103B0000" />
+        <register type="NOA" address="0x00009888" value="0x083C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A3E0040" />
+        <register type="NOA" address="0x00009888" value="0x043F8000" />
+        <register type="NOA" address="0x00009888" value="0x02594000" />
+        <register type="NOA" address="0x00009888" value="0x045A8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1C0400" />
+        <register type="NOA" address="0x00009888" value="0x041D8000" />
+        <register type="NOA" address="0x00009888" value="0x081E02C0" />
+        <register type="NOA" address="0x00009888" value="0x0E1E0000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA800" />
+        <register type="NOA" address="0x00009888" value="0x0E1F0260" />
+        <register type="NOA" address="0x00009888" value="0x101F0014" />
+        <register type="NOA" address="0x00009888" value="0x003905E0" />
+        <register type="NOA" address="0x00009888" value="0x06390BC0" />
+        <register type="NOA" address="0x00009888" value="0x02390018" />
+        <register type="NOA" address="0x00009888" value="0x04394000" />
+        <register type="NOA" address="0x00009888" value="0x04BB0042" />
+        <register type="NOA" address="0x00009888" value="0x10BB0000" />
+        <register type="NOA" address="0x00009888" value="0x02BC05C0" />
+        <register type="NOA" address="0x00009888" value="0x08BC0000" />
+        <register type="NOA" address="0x00009888" value="0x0ABE0004" />
+        <register type="NOA" address="0x00009888" value="0x02BF8000" />
+        <register type="NOA" address="0x00009888" value="0x02D91000" />
+        <register type="NOA" address="0x00009888" value="0x02DA8000" />
+        <register type="NOA" address="0x00009888" value="0x089C8000" />
+        <register type="NOA" address="0x00009888" value="0x029D8000" />
+        <register type="NOA" address="0x00009888" value="0x089E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E9E0000" />
+        <register type="NOA" address="0x00009888" value="0x0E9FA806" />
+        <register type="NOA" address="0x00009888" value="0x109F0142" />
+        <register type="NOA" address="0x00009888" value="0x08B90617" />
+        <register type="NOA" address="0x00009888" value="0x0AB90BE0" />
+        <register type="NOA" address="0x00009888" value="0x02B94000" />
+        <register type="NOA" address="0x00009888" value="0x0D88F000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000C" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x018A8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A2800" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x238B52A0" />
+        <register type="NOA" address="0x00009888" value="0x258B6A95" />
+        <register type="NOA" address="0x00009888" value="0x278B0029" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C1500" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0014" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x038D8000" />
+        <register type="NOA" address="0x00009888" value="0x058D2000" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA80" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x01834000" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0184C000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1180C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x4D800444" />
+        <register type="NOA" address="0x00009888" value="0x3D800000" />
+        <register type="NOA" address="0x00009888" value="0x4F804000" />
+        <register type="NOA" address="0x00009888" value="0x43801080" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800084" />
+        <register type="NOA" address="0x00009888" value="0x53800044" />
+        <register type="NOA" address="0x00009888" value="0x47801080" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800840" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00006000" />
+        <register type="OA" address="0x00002774" value="0x0000F3FF" />
+        <register type="OA" address="0x00002778" value="0x00001800" />
+        <register type="OA" address="0x0000277C" value="0x0000FCFF" />
+        <register type="OA" address="0x00002780" value="0x00000600" />
+        <register type="OA" address="0x00002784" value="0x0000FF3F" />
+        <register type="OA" address="0x00002788" value="0x00000180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000060" />
+        <register type="OA" address="0x00002794" value="0x0000FFF3" />
+        <register type="OA" address="0x00002798" value="0x00000018" />
+        <register type="OA" address="0x0000279C" value="0x0000FFFC" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler_1"
+       hw_config_guid="05450fec-bb5c-4b0a-8995-e03631168a34"
+       chipset="CHV"
+       symbol_name="Sampler_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Slice1 Subslice0 Input Available"
+             description="The percentage of time in which slice1 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler10_input_available"
+             units="percent"
+             symbol_name="Sampler10InputAvailable"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Slice1 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice1 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler12_output_ready"
+             units="percent"
+             symbol_name="Sampler12OutputReady"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Subslice1 Input Available"
+             description="The percentage of time in which slice1 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler11_input_available"
+             units="percent"
+             symbol_name="Sampler11InputAvailable"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice1 Subslice2 Input Available"
+             description="The percentage of time in which slice1 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler12_input_available"
+             units="percent"
+             symbol_name="Sampler12InputAvailable"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice1 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice1 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler10_output_ready"
+             units="percent"
+             symbol_name="Sampler10OutputReady"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Slice1 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice1 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler11_output_ready"
+             units="percent"
+             symbol_name="Sampler11OutputReady"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x18921400" />
+        <register type="NOA" address="0x00009888" value="0x149500AB" />
+        <register type="NOA" address="0x00009888" value="0x18B21400" />
+        <register type="NOA" address="0x00009888" value="0x14B500AB" />
+        <register type="NOA" address="0x00009888" value="0x18D21400" />
+        <register type="NOA" address="0x00009888" value="0x14D500AB" />
+        <register type="NOA" address="0x00009888" value="0x0CDC8000" />
+        <register type="NOA" address="0x00009888" value="0x0EDC4000" />
+        <register type="NOA" address="0x00009888" value="0x02DCC000" />
+        <register type="NOA" address="0x00009888" value="0x04DCC000" />
+        <register type="NOA" address="0x00009888" value="0x1ABD00A0" />
+        <register type="NOA" address="0x00009888" value="0x0ABD8000" />
+        <register type="NOA" address="0x00009888" value="0x0CD88000" />
+        <register type="NOA" address="0x00009888" value="0x0ED84000" />
+        <register type="NOA" address="0x00009888" value="0x04D88000" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0050" />
+        <register type="NOA" address="0x00009888" value="0x04DB8000" />
+        <register type="NOA" address="0x00009888" value="0x06DB8000" />
+        <register type="NOA" address="0x00009888" value="0x08DB8000" />
+        <register type="NOA" address="0x00009888" value="0x0ADB4000" />
+        <register type="NOA" address="0x00009888" value="0x109F02A0" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F00AA" />
+        <register type="NOA" address="0x00009888" value="0x18B82500" />
+        <register type="NOA" address="0x00009888" value="0x02B88000" />
+        <register type="NOA" address="0x00009888" value="0x04B84000" />
+        <register type="NOA" address="0x00009888" value="0x06B84000" />
+        <register type="NOA" address="0x00009888" value="0x08B84000" />
+        <register type="NOA" address="0x00009888" value="0x0AB84000" />
+        <register type="NOA" address="0x00009888" value="0x0CB88000" />
+        <register type="NOA" address="0x00009888" value="0x0CB98000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x00B98000" />
+        <register type="NOA" address="0x00009888" value="0x02B9A000" />
+        <register type="NOA" address="0x00009888" value="0x04B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06B92000" />
+        <register type="NOA" address="0x00009888" value="0x1ABA0200" />
+        <register type="NOA" address="0x00009888" value="0x02BA8000" />
+        <register type="NOA" address="0x00009888" value="0x0CBA8000" />
+        <register type="NOA" address="0x00009888" value="0x04908000" />
+        <register type="NOA" address="0x00009888" value="0x04918000" />
+        <register type="NOA" address="0x00009888" value="0x04927300" />
+        <register type="NOA" address="0x00009888" value="0x10920000" />
+        <register type="NOA" address="0x00009888" value="0x1893000A" />
+        <register type="NOA" address="0x00009888" value="0x0A934000" />
+        <register type="NOA" address="0x00009888" value="0x0A946000" />
+        <register type="NOA" address="0x00009888" value="0x0C959000" />
+        <register type="NOA" address="0x00009888" value="0x0E950098" />
+        <register type="NOA" address="0x00009888" value="0x10950000" />
+        <register type="NOA" address="0x00009888" value="0x04B04000" />
+        <register type="NOA" address="0x00009888" value="0x04B14000" />
+        <register type="NOA" address="0x00009888" value="0x04B20073" />
+        <register type="NOA" address="0x00009888" value="0x10B20000" />
+        <register type="NOA" address="0x00009888" value="0x04B38000" />
+        <register type="NOA" address="0x00009888" value="0x06B38000" />
+        <register type="NOA" address="0x00009888" value="0x08B34000" />
+        <register type="NOA" address="0x00009888" value="0x04B4C000" />
+        <register type="NOA" address="0x00009888" value="0x02B59890" />
+        <register type="NOA" address="0x00009888" value="0x10B50000" />
+        <register type="NOA" address="0x00009888" value="0x06D04000" />
+        <register type="NOA" address="0x00009888" value="0x06D14000" />
+        <register type="NOA" address="0x00009888" value="0x06D20073" />
+        <register type="NOA" address="0x00009888" value="0x10D20000" />
+        <register type="NOA" address="0x00009888" value="0x18D30020" />
+        <register type="NOA" address="0x00009888" value="0x02D38000" />
+        <register type="NOA" address="0x00009888" value="0x0CD34000" />
+        <register type="NOA" address="0x00009888" value="0x0AD48000" />
+        <register type="NOA" address="0x00009888" value="0x04D42000" />
+        <register type="NOA" address="0x00009888" value="0x0ED59000" />
+        <register type="NOA" address="0x00009888" value="0x00D59800" />
+        <register type="NOA" address="0x00009888" value="0x10D50000" />
+        <register type="NOA" address="0x00009888" value="0x0F88000E" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B5500" />
+        <register type="NOA" address="0x00009888" value="0x258B000A" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8D8000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x018D8000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x2185000A" />
+        <register type="NOA" address="0x00009888" value="0x1B830150" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D848000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D808000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47801021" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800C64" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800C02" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler_2"
+       hw_config_guid="883c8a56-8767-4de8-beec-a99462c6674b"
+       chipset="CHV"
+       symbol_name="Sampler_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x18121400" />
+        <register type="NOA" address="0x00009888" value="0x141500AB" />
+        <register type="NOA" address="0x00009888" value="0x18321400" />
+        <register type="NOA" address="0x00009888" value="0x143500AB" />
+        <register type="NOA" address="0x00009888" value="0x18521400" />
+        <register type="NOA" address="0x00009888" value="0x145500AB" />
+        <register type="NOA" address="0x00009888" value="0x0C5C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5C4000" />
+        <register type="NOA" address="0x00009888" value="0x025CC000" />
+        <register type="NOA" address="0x00009888" value="0x045CC000" />
+        <register type="NOA" address="0x00009888" value="0x1A3D00A0" />
+        <register type="NOA" address="0x00009888" value="0x0A3D8000" />
+        <register type="NOA" address="0x00009888" value="0x0C588000" />
+        <register type="NOA" address="0x00009888" value="0x0E584000" />
+        <register type="NOA" address="0x00009888" value="0x04588000" />
+        <register type="NOA" address="0x00009888" value="0x1A5B0050" />
+        <register type="NOA" address="0x00009888" value="0x045B8000" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B8000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B4000" />
+        <register type="NOA" address="0x00009888" value="0x101F02A0" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00AA" />
+        <register type="NOA" address="0x00009888" value="0x18382500" />
+        <register type="NOA" address="0x00009888" value="0x02388000" />
+        <register type="NOA" address="0x00009888" value="0x04384000" />
+        <register type="NOA" address="0x00009888" value="0x06384000" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0C388000" />
+        <register type="NOA" address="0x00009888" value="0x0C398000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x00398000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x1A3A0200" />
+        <register type="NOA" address="0x00009888" value="0x023A8000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A8000" />
+        <register type="NOA" address="0x00009888" value="0x04108000" />
+        <register type="NOA" address="0x00009888" value="0x04118000" />
+        <register type="NOA" address="0x00009888" value="0x04127300" />
+        <register type="NOA" address="0x00009888" value="0x10120000" />
+        <register type="NOA" address="0x00009888" value="0x1813000A" />
+        <register type="NOA" address="0x00009888" value="0x0A134000" />
+        <register type="NOA" address="0x00009888" value="0x0A146000" />
+        <register type="NOA" address="0x00009888" value="0x0C159000" />
+        <register type="NOA" address="0x00009888" value="0x0E150098" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04304000" />
+        <register type="NOA" address="0x00009888" value="0x04314000" />
+        <register type="NOA" address="0x00009888" value="0x04320073" />
+        <register type="NOA" address="0x00009888" value="0x10320000" />
+        <register type="NOA" address="0x00009888" value="0x04338000" />
+        <register type="NOA" address="0x00009888" value="0x06338000" />
+        <register type="NOA" address="0x00009888" value="0x08334000" />
+        <register type="NOA" address="0x00009888" value="0x0434C000" />
+        <register type="NOA" address="0x00009888" value="0x02359890" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x06504000" />
+        <register type="NOA" address="0x00009888" value="0x06514000" />
+        <register type="NOA" address="0x00009888" value="0x06520073" />
+        <register type="NOA" address="0x00009888" value="0x10520000" />
+        <register type="NOA" address="0x00009888" value="0x18530020" />
+        <register type="NOA" address="0x00009888" value="0x02538000" />
+        <register type="NOA" address="0x00009888" value="0x0C534000" />
+        <register type="NOA" address="0x00009888" value="0x0A548000" />
+        <register type="NOA" address="0x00009888" value="0x04542000" />
+        <register type="NOA" address="0x00009888" value="0x0E559000" />
+        <register type="NOA" address="0x00009888" value="0x00559800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AA000" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x258B0005" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x2185000A" />
+        <register type="NOA" address="0x00009888" value="0x1B830150" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0D848000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x07844000" />
+        <register type="NOA" address="0x00009888" value="0x1D808000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x17804000" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47801021" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800C64" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x41800C02" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="eb97e523-d9ac-48a9-b7f8-9cc909ddbf14"
+       chipset="CHV"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice1 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice1 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread11_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread11ReadyForDispatch"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice1 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice1 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread12_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread12ReadyForDispatch"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice1 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice1 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread10_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread10ReadyForDispatch"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice1 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice1 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread12_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread12ReadyForDispatch"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice1 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice1 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread10_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread10ReadyForDispatch"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice1 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice1 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread11_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread11ReadyForDispatch"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x16154D60" />
+        <register type="NOA" address="0x00009888" value="0x16352E60" />
+        <register type="NOA" address="0x00009888" value="0x16554D60" />
+        <register type="NOA" address="0x00009888" value="0x16950000" />
+        <register type="NOA" address="0x00009888" value="0x16B50000" />
+        <register type="NOA" address="0x00009888" value="0x16D50000" />
+        <register type="NOA" address="0x00009888" value="0x005C8000" />
+        <register type="NOA" address="0x00009888" value="0x045CC000" />
+        <register type="NOA" address="0x00009888" value="0x065C4000" />
+        <register type="NOA" address="0x00009888" value="0x083D8000" />
+        <register type="NOA" address="0x00009888" value="0x0A3D8000" />
+        <register type="NOA" address="0x00009888" value="0x0458C000" />
+        <register type="NOA" address="0x00009888" value="0x025B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B4000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E1F00AA" />
+        <register type="NOA" address="0x00009888" value="0x02384000" />
+        <register type="NOA" address="0x00009888" value="0x04388000" />
+        <register type="NOA" address="0x00009888" value="0x06388000" />
+        <register type="NOA" address="0x00009888" value="0x08384000" />
+        <register type="NOA" address="0x00009888" value="0x0A384000" />
+        <register type="NOA" address="0x00009888" value="0x0C384000" />
+        <register type="NOA" address="0x00009888" value="0x00398000" />
+        <register type="NOA" address="0x00009888" value="0x0239A000" />
+        <register type="NOA" address="0x00009888" value="0x0439A000" />
+        <register type="NOA" address="0x00009888" value="0x06392000" />
+        <register type="NOA" address="0x00009888" value="0x043A8000" />
+        <register type="NOA" address="0x00009888" value="0x063A8000" />
+        <register type="NOA" address="0x00009888" value="0x08138000" />
+        <register type="NOA" address="0x00009888" value="0x0A138000" />
+        <register type="NOA" address="0x00009888" value="0x06143000" />
+        <register type="NOA" address="0x00009888" value="0x0415CFC7" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x02338000" />
+        <register type="NOA" address="0x00009888" value="0x0C338000" />
+        <register type="NOA" address="0x00009888" value="0x04342000" />
+        <register type="NOA" address="0x00009888" value="0x06344000" />
+        <register type="NOA" address="0x00009888" value="0x0035C700" />
+        <register type="NOA" address="0x00009888" value="0x063500CF" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04538000" />
+        <register type="NOA" address="0x00009888" value="0x06538000" />
+        <register type="NOA" address="0x00009888" value="0x0454C000" />
+        <register type="NOA" address="0x00009888" value="0x0255CFC7" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06DC8000" />
+        <register type="NOA" address="0x00009888" value="0x08DC4000" />
+        <register type="NOA" address="0x00009888" value="0x0CDCC000" />
+        <register type="NOA" address="0x00009888" value="0x0EDCC000" />
+        <register type="NOA" address="0x00009888" value="0x1ABD00A8" />
+        <register type="NOA" address="0x00009888" value="0x0CD8C000" />
+        <register type="NOA" address="0x00009888" value="0x0ED84000" />
+        <register type="NOA" address="0x00009888" value="0x0EDB8000" />
+        <register type="NOA" address="0x00009888" value="0x18DB0800" />
+        <register type="NOA" address="0x00009888" value="0x1ADB0254" />
+        <register type="NOA" address="0x00009888" value="0x0E9FAA00" />
+        <register type="NOA" address="0x00009888" value="0x109F02AA" />
+        <register type="NOA" address="0x00009888" value="0x0EB84000" />
+        <register type="NOA" address="0x00009888" value="0x16B84000" />
+        <register type="NOA" address="0x00009888" value="0x18B8156A" />
+        <register type="NOA" address="0x00009888" value="0x06B98000" />
+        <register type="NOA" address="0x00009888" value="0x08B9A000" />
+        <register type="NOA" address="0x00009888" value="0x0AB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0CB9A000" />
+        <register type="NOA" address="0x00009888" value="0x0EB9A000" />
+        <register type="NOA" address="0x00009888" value="0x18BAA000" />
+        <register type="NOA" address="0x00009888" value="0x1ABA0002" />
+        <register type="NOA" address="0x00009888" value="0x16934000" />
+        <register type="NOA" address="0x00009888" value="0x1893000A" />
+        <register type="NOA" address="0x00009888" value="0x0A947000" />
+        <register type="NOA" address="0x00009888" value="0x0C95C5C1" />
+        <register type="NOA" address="0x00009888" value="0x0E9500C3" />
+        <register type="NOA" address="0x00009888" value="0x10950000" />
+        <register type="NOA" address="0x00009888" value="0x0EB38000" />
+        <register type="NOA" address="0x00009888" value="0x16B30040" />
+        <register type="NOA" address="0x00009888" value="0x18B30020" />
+        <register type="NOA" address="0x00009888" value="0x06B48000" />
+        <register type="NOA" address="0x00009888" value="0x08B41000" />
+        <register type="NOA" address="0x00009888" value="0x0AB48000" />
+        <register type="NOA" address="0x00009888" value="0x06B5C500" />
+        <register type="NOA" address="0x00009888" value="0x08B500C3" />
+        <register type="NOA" address="0x00009888" value="0x0EB5C100" />
+        <register type="NOA" address="0x00009888" value="0x10B50000" />
+        <register type="NOA" address="0x00009888" value="0x16D31500" />
+        <register type="NOA" address="0x00009888" value="0x08D4E000" />
+        <register type="NOA" address="0x00009888" value="0x08D5C100" />
+        <register type="NOA" address="0x00009888" value="0x0AD5C3C5" />
+        <register type="NOA" address="0x00009888" value="0x10D50000" />
+        <register type="NOA" address="0x00009888" value="0x0D88F800" />
+        <register type="NOA" address="0x00009888" value="0x0F88000F" />
+        <register type="NOA" address="0x00009888" value="0x038A8000" />
+        <register type="NOA" address="0x00009888" value="0x058A8000" />
+        <register type="NOA" address="0x00009888" value="0x078A8000" />
+        <register type="NOA" address="0x00009888" value="0x098A8000" />
+        <register type="NOA" address="0x00009888" value="0x0B8A8000" />
+        <register type="NOA" address="0x00009888" value="0x0D8A8000" />
+        <register type="NOA" address="0x00009888" value="0x258BAAA5" />
+        <register type="NOA" address="0x00009888" value="0x278B002A" />
+        <register type="NOA" address="0x00009888" value="0x238B2A80" />
+        <register type="NOA" address="0x00009888" value="0x0F8C4000" />
+        <register type="NOA" address="0x00009888" value="0x178C2000" />
+        <register type="NOA" address="0x00009888" value="0x198C5500" />
+        <register type="NOA" address="0x00009888" value="0x1B8C0015" />
+        <register type="NOA" address="0x00009888" value="0x078D8000" />
+        <register type="NOA" address="0x00009888" value="0x098DA000" />
+        <register type="NOA" address="0x00009888" value="0x0B8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0D8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0F8DA000" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800C42" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45800063" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x47800800" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F8014A4" />
+        <register type="NOA" address="0x00009888" value="0x41801042" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x0000FE7F" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFBF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFF7" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FFF9" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="dff6158e-8409-452c-be76-91c9946330bd"
+       chipset="CHV"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice1 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header11_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader11ReadyPort1"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice1 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header11_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader11ReadyPort0"
+             availability="$SubsliceMask 0x10 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice1 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header12_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader12ReadyPort0"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice1 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header10_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader10ReadyPort1"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice1 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header12_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader12ReadyPort1"
+             availability="$SubsliceMask 0x20 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL 2 UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice1 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header10_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader10ReadyPort0"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x16150000" />
+        <register type="NOA" address="0x00009888" value="0x16350000" />
+        <register type="NOA" address="0x00009888" value="0x16550000" />
+        <register type="NOA" address="0x00009888" value="0x16952E60" />
+        <register type="NOA" address="0x00009888" value="0x16B54D60" />
+        <register type="NOA" address="0x00009888" value="0x16D52E60" />
+        <register type="NOA" address="0x00009888" value="0x065C8000" />
+        <register type="NOA" address="0x00009888" value="0x085CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A5CC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5C4000" />
+        <register type="NOA" address="0x00009888" value="0x0E3D8000" />
+        <register type="NOA" address="0x00009888" value="0x183DA000" />
+        <register type="NOA" address="0x00009888" value="0x06588000" />
+        <register type="NOA" address="0x00009888" value="0x08588000" />
+        <register type="NOA" address="0x00009888" value="0x0A584000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x185B5800" />
+        <register type="NOA" address="0x00009888" value="0x1A5B000A" />
+        <register type="NOA" address="0x00009888" value="0x0E1FAA00" />
+        <register type="NOA" address="0x00009888" value="0x101F02AA" />
+        <register type="NOA" address="0x00009888" value="0x0E384000" />
+        <register type="NOA" address="0x00009888" value="0x16384000" />
+        <register type="NOA" address="0x00009888" value="0x18382A55" />
+        <register type="NOA" address="0x00009888" value="0x06398000" />
+        <register type="NOA" address="0x00009888" value="0x0839A000" />
+        <register type="NOA" address="0x00009888" value="0x0A39A000" />
+        <register type="NOA" address="0x00009888" value="0x0C39A000" />
+        <register type="NOA" address="0x00009888" value="0x0E39A000" />
+        <register type="NOA" address="0x00009888" value="0x1A3A02A0" />
+        <register type="NOA" address="0x00009888" value="0x0E138000" />
+        <register type="NOA" address="0x00009888" value="0x16130500" />
+        <register type="NOA" address="0x00009888" value="0x06148000" />
+        <register type="NOA" address="0x00009888" value="0x08146000" />
+        <register type="NOA" address="0x00009888" value="0x0615C100" />
+        <register type="NOA" address="0x00009888" value="0x0815C500" />
+        <register type="NOA" address="0x00009888" value="0x0A1500C3" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x16335040" />
+        <register type="NOA" address="0x00009888" value="0x08349000" />
+        <register type="NOA" address="0x00009888" value="0x0A341000" />
+        <register type="NOA" address="0x00009888" value="0x083500C1" />
+        <register type="NOA" address="0x00009888" value="0x0A35C500" />
+        <register type="NOA" address="0x00009888" value="0x0C3500C3" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x1853002A" />
+        <register type="NOA" address="0x00009888" value="0x0A54E000" />
+        <register type="NOA" address="0x00009888" value="0x0C55C500" />
+        <register type="NOA" address="0x00009888" value="0x0E55C1C3" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x00DC8000" />
+        <register type="NOA" address="0x00009888" value="0x02DCC000" />
+        <register type="NOA" address="0x00009888" value="0x04DC4000" />
+        <register type="NOA" address="0x00009888" value="0x04BD8000" />
+        <register type="NOA" address="0x00009888" value="0x06BD8000" />
+        <register type="NOA" address="0x00009888" value="0x02D8C000" />
+        <register type="NOA" address="0x00009888" value="0x02DB8000" />
+        <register type="NOA" address="0x00009888" value="0x04DB4000" />
+        <register type="NOA" address="0x00009888" value="0x06DB4000" />
+        <register type="NOA" address="0x00009888" value="0x08DB8000" />
+        <register type="NOA" address="0x00009888" value="0x0C9FA000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F00AA" />
+        <register type="NOA" address="0x00009888" value="0x02B84000" />
+        <register type="NOA" address="0x00009888" value="0x04B84000" />
+        <register type="NOA" address="0x00009888" value="0x06B84000" />
+        <register type="NOA" address="0x00009888" value="0x08B84000" />
+        <register type="NOA" address="0x00009888" value="0x0AB88000" />
+        <register type="NOA" address="0x00009888" value="0x0CB88000" />
+        <register type="NOA" address="0x00009888" value="0x00B98000" />
+        <register type="NOA" address="0x00009888" value="0x02B9A000" />
+        <register type="NOA" address="0x00009888" value="0x04B9A000" />
+        <register type="NOA" address="0x00009888" value="0x06B92000" />
+        <register type="NOA" address="0x00009888" value="0x0ABA8000" />
+        <register type="NOA" address="0x00009888" value="0x0CBA8000" />
+        <register type="NOA" address="0x00009888" value="0x04938000" />
+        <register type="NOA" address="0x00009888" value="0x06938000" />
+        <register type="NOA" address="0x00009888" value="0x0494C000" />
+        <register type="NOA" address="0x00009888" value="0x0295CFC7" />
+        <register type="NOA" address="0x00009888" value="0x10950000" />
+        <register type="NOA" address="0x00009888" value="0x02B38000" />
+        <register type="NOA" address="0x00009888" value="0x08B38000" />
+        <register type="NOA" address="0x00009888" value="0x04B42000" />
+        <register type="NOA" address="0x00009888" value="0x06B41000" />
+        <register type="NOA" address="0x00009888" value="0x00B5C700" />
+        <register type="NOA" address="0x00009888" value="0x04B500CF" />
+        <register type="NOA" address="0x00009888" value="0x10B50000" />
+        <register type="NOA" address="0x00009888" value="0x0AD38000" />
+        <register type="NOA" address="0x00009888" value="0x0CD38000" />
+        <register type="NOA" address="0x00009888" value="0x06D46000" />
+        <register type="NOA" address="0x00009888" value="0x04D5C700" />
+        <register type="NOA" address="0x00009888" value="0x06D500CF" />
+        <register type="NOA" address="0x00009888" value="0x10D50000" />
+        <register type="NOA" address="0x00009888" value="0x03888000" />
+        <register type="NOA" address="0x00009888" value="0x05888000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x09888000" />
+        <register type="NOA" address="0x00009888" value="0x0B888000" />
+        <register type="NOA" address="0x00009888" value="0x0D880400" />
+        <register type="NOA" address="0x00009888" value="0x0F8A8000" />
+        <register type="NOA" address="0x00009888" value="0x198A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8AAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0002" />
+        <register type="NOA" address="0x00009888" value="0x258B555A" />
+        <register type="NOA" address="0x00009888" value="0x278B0015" />
+        <register type="NOA" address="0x00009888" value="0x238B5500" />
+        <register type="NOA" address="0x00009888" value="0x038C4000" />
+        <register type="NOA" address="0x00009888" value="0x058C4000" />
+        <register type="NOA" address="0x00009888" value="0x078C4000" />
+        <register type="NOA" address="0x00009888" value="0x098C4000" />
+        <register type="NOA" address="0x00009888" value="0x0B8C4000" />
+        <register type="NOA" address="0x00009888" value="0x0D8C4000" />
+        <register type="NOA" address="0x00009888" value="0x018D8000" />
+        <register type="NOA" address="0x00009888" value="0x038DA000" />
+        <register type="NOA" address="0x00009888" value="0x058DA000" />
+        <register type="NOA" address="0x00009888" value="0x078D2000" />
+        <register type="NOA" address="0x00009888" value="0x2185AAAA" />
+        <register type="NOA" address="0x00009888" value="0x2385002A" />
+        <register type="NOA" address="0x00009888" value="0x1F85AA00" />
+        <register type="NOA" address="0x00009888" value="0x0F834000" />
+        <register type="NOA" address="0x00009888" value="0x19835400" />
+        <register type="NOA" address="0x00009888" value="0x1B830155" />
+        <register type="NOA" address="0x00009888" value="0x03834000" />
+        <register type="NOA" address="0x00009888" value="0x05834000" />
+        <register type="NOA" address="0x00009888" value="0x07834000" />
+        <register type="NOA" address="0x00009888" value="0x09834000" />
+        <register type="NOA" address="0x00009888" value="0x0B834000" />
+        <register type="NOA" address="0x00009888" value="0x0D834000" />
+        <register type="NOA" address="0x00009888" value="0x0784C000" />
+        <register type="NOA" address="0x00009888" value="0x0984C000" />
+        <register type="NOA" address="0x00009888" value="0x0B84C000" />
+        <register type="NOA" address="0x00009888" value="0x0D84C000" />
+        <register type="NOA" address="0x00009888" value="0x0F84C000" />
+        <register type="NOA" address="0x00009888" value="0x01848000" />
+        <register type="NOA" address="0x00009888" value="0x0384C000" />
+        <register type="NOA" address="0x00009888" value="0x0584C000" />
+        <register type="NOA" address="0x00009888" value="0x1780C000" />
+        <register type="NOA" address="0x00009888" value="0x1980C000" />
+        <register type="NOA" address="0x00009888" value="0x1B80C000" />
+        <register type="NOA" address="0x00009888" value="0x1D80C000" />
+        <register type="NOA" address="0x00009888" value="0x1F80C000" />
+        <register type="NOA" address="0x00009888" value="0x11808000" />
+        <register type="NOA" address="0x00009888" value="0x1380C000" />
+        <register type="NOA" address="0x00009888" value="0x1580C000" />
+        <register type="NOA" address="0x00009888" value="0x4F800000" />
+        <register type="NOA" address="0x00009888" value="0x43800882" />
+        <register type="NOA" address="0x00009888" value="0x51800000" />
+        <register type="NOA" address="0x00009888" value="0x45801082" />
+        <register type="NOA" address="0x00009888" value="0x53800000" />
+        <register type="NOA" address="0x00009888" value="0x478014A5" />
+        <register type="NOA" address="0x00009888" value="0x21800000" />
+        <register type="NOA" address="0x00009888" value="0x31800000" />
+        <register type="NOA" address="0x00009888" value="0x4D800000" />
+        <register type="NOA" address="0x00009888" value="0x3F800002" />
+        <register type="NOA" address="0x00009888" value="0x41800C62" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x0000FE7F" />
+        <register type="OA" address="0x00002780" value="0x00000000" />
+        <register type="OA" address="0x00002784" value="0x0000FF9F" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000FFE7" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFFB" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FFFD" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen8LP"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="4a534b07-cba3-414d-8d60-874830e883aa"
+       chipset="CHV"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x59800000" />
+        <register type="NOA" address="0x00009888" value="0x59800001" />
+        <register type="NOA" address="0x00009888" value="0x338B0000" />
+        <register type="NOA" address="0x00009888" value="0x258B0066" />
+        <register type="NOA" address="0x00009888" value="0x058B0000" />
+        <register type="NOA" address="0x00009888" value="0x038B0000" />
+        <register type="NOA" address="0x00009888" value="0x03844000" />
+        <register type="NOA" address="0x00009888" value="0x47800080" />
+        <register type="NOA" address="0x00009888" value="0x57800000" />
+        <register type="NOA" address="0x001823A4" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x59800000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-cnl.xml b/lib/i915/perf-configs/oa-cnl.xml
new file mode 100644
index 00000000..182d6c4a
--- /dev/null
+++ b/lib/i915/perf-configs/oa-cnl.xml
@@ -0,0 +1,10411 @@
+<?xml version="1.0"?>
+<metrics version="1553959724" merge_md5="">
+  <set name="Render Metrics Basic Gen10"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="2d975e19-7130-41d2-b06f-79d74f91e7c8"
+       chipset="CNL"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 2 READ C 3 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="$SliceMask 1 AND B 4 READ UMUL $SliceMask 1 >> 1 AND B 5 READ UMUL UADD 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="64 $SamplerL1Misses UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler00 Busy"
+             description="The percentage of time in which Slice0 Sampler0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_busy"
+             units="percent"
+             symbol_name="Sampler00Busy"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler10 Busy"
+             description="The percentage of time in which Slice1 Sampler0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler10_busy"
+             units="percent"
+             symbol_name="Sampler10Busy"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$SubsliceMask 1 AND $Sampler00Busy FMUL $SubsliceMask 3 >> 1 AND $Sampler10Busy FMUL FADD $SubsliceMask 1 AND $SubsliceMask 3 >> 1 AND FADD FDIV"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             availability="$SubsliceMask 9 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Sampler00 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Slice0 Sampler0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler00_bottleneck"
+             units="percent"
+             symbol_name="Sampler00Bottleneck"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  C 6 READ UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="128  B 6 READ UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Sampler10 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Slice1 Sampler0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler10_bottleneck"
+             units="percent"
+             symbol_name="Sampler10Bottleneck"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$SubsliceMask 1 AND $Sampler00Bottleneck FMUL $SubsliceMask 3 >> 1 AND $Sampler10Bottleneck FMUL FADD $SubsliceMask 1 AND $SubsliceMask 3 >> 1 AND FADD FDIV"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             availability="$SubsliceMask 9 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 0 READ C 1 READ UADD 128 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  C 7 READ UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x146C0008" />
+        <register type="NOA" address="0x00009888" value="0x18110014" />
+        <register type="NOA" address="0x00009888" value="0x14EC0008" />
+        <register type="NOA" address="0x00009888" value="0x18910014" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0054" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0444" />
+        <register type="NOA" address="0x00009888" value="0x02738000" />
+        <register type="NOA" address="0x00009888" value="0x0473E000" />
+        <register type="NOA" address="0x00009888" value="0x04742000" />
+        <register type="NOA" address="0x00009888" value="0x0C742000" />
+        <register type="NOA" address="0x00009888" value="0x04752000" />
+        <register type="NOA" address="0x00009888" value="0x0C752000" />
+        <register type="NOA" address="0x00009888" value="0x0C760800" />
+        <register type="NOA" address="0x00009888" value="0x0E760800" />
+        <register type="NOA" address="0x00009888" value="0x0077C000" />
+        <register type="NOA" address="0x00009888" value="0x0E778000" />
+        <register type="NOA" address="0x00009888" value="0x1477C000" />
+        <register type="NOA" address="0x00009888" value="0x167702A0" />
+        <register type="NOA" address="0x00009888" value="0x00194000" />
+        <register type="NOA" address="0x00009888" value="0x1A190020" />
+        <register type="NOA" address="0x00009888" value="0x00110060" />
+        <register type="NOA" address="0x00009888" value="0x08110061" />
+        <register type="NOA" address="0x00009888" value="0x1E110000" />
+        <register type="NOA" address="0x00009888" value="0x10110000" />
+        <register type="NOA" address="0x00009888" value="0x18144000" />
+        <register type="NOA" address="0x00009888" value="0x1C140400" />
+        <register type="NOA" address="0x00009888" value="0x0AEC5400" />
+        <register type="NOA" address="0x00009888" value="0x10EC0000" />
+        <register type="NOA" address="0x00009888" value="0x1AEC0000" />
+        <register type="NOA" address="0x00009888" value="0x04F38000" />
+        <register type="NOA" address="0x00009888" value="0x0AF48000" />
+        <register type="NOA" address="0x00009888" value="0x0CF48000" />
+        <register type="NOA" address="0x00009888" value="0x0AF58000" />
+        <register type="NOA" address="0x00009888" value="0x0CF58000" />
+        <register type="NOA" address="0x00009888" value="0x0EF62200" />
+        <register type="NOA" address="0x00009888" value="0x0EF7C000" />
+        <register type="NOA" address="0x00009888" value="0x16F70230" />
+        <register type="NOA" address="0x00009888" value="0x0E994000" />
+        <register type="NOA" address="0x00009888" value="0x1A990080" />
+        <register type="NOA" address="0x00009888" value="0x06916000" />
+        <register type="NOA" address="0x00009888" value="0x08916100" />
+        <register type="NOA" address="0x00009888" value="0x1E910000" />
+        <register type="NOA" address="0x00009888" value="0x1C941100" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x0B086F4F" />
+        <register type="NOA" address="0x00009888" value="0x0D080001" />
+        <register type="NOA" address="0x00009888" value="0x1D073800" />
+        <register type="NOA" address="0x00009888" value="0x1F070140" />
+        <register type="NOA" address="0x00009888" value="0x09081E93" />
+        <register type="NOA" address="0x00009888" value="0x01083160" />
+        <register type="NOA" address="0x00009888" value="0x030801A6" />
+        <register type="NOA" address="0x00009888" value="0x11080000" />
+        <register type="NOA" address="0x00009888" value="0x0F080000" />
+        <register type="NOA" address="0x00009888" value="0x0D095000" />
+        <register type="NOA" address="0x00009888" value="0x0F095000" />
+        <register type="NOA" address="0x00009888" value="0x01094000" />
+        <register type="NOA" address="0x00009888" value="0x03095000" />
+        <register type="NOA" address="0x00009888" value="0x05091000" />
+        <register type="NOA" address="0x00009888" value="0x13040154" />
+        <register type="NOA" address="0x00009888" value="0x09044000" />
+        <register type="NOA" address="0x00009888" value="0x0B045000" />
+        <register type="NOA" address="0x00009888" value="0x0D049000" />
+        <register type="NOA" address="0x00009888" value="0x0F042000" />
+        <register type="NOA" address="0x00009888" value="0x0507E700" />
+        <register type="NOA" address="0x00009888" value="0x070700D7" />
+        <register type="NOA" address="0x00009888" value="0x25070000" />
+        <register type="NOA" address="0x00009888" value="0x1B070000" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2100C000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x29004000" />
+        <register type="NOA" address="0x00009888" value="0x2B004000" />
+        <register type="NOA" address="0x00009888" value="0x2D004000" />
+        <register type="NOA" address="0x00009888" value="0x2F004000" />
+        <register type="NOA" address="0x00009888" value="0x13004000" />
+        <register type="NOA" address="0x00009888" value="0x15004000" />
+        <register type="NOA" address="0x00009888" value="0x17004000" />
+        <register type="NOA" address="0x00009888" value="0x19004000" />
+        <register type="NOA" address="0x00009888" value="0x1B004000" />
+        <register type="NOA" address="0x00009888" value="0x1D004000" />
+        <register type="NOA" address="0x00009888" value="0x47003331" />
+        <register type="NOA" address="0x00009888" value="0x390018C1" />
+        <register type="NOA" address="0x00009888" value="0x49000333" />
+        <register type="NOA" address="0x00009888" value="0x3D000407" />
+        <register type="NOA" address="0x00009888" value="0x4B001101" />
+        <register type="NOA" address="0x00009888" value="0x3F000120" />
+        <register type="NOA" address="0x00009888" value="0x4D003333" />
+        <register type="NOA" address="0x00009888" value="0x410018C6" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000006" />
+        <register type="NOA" address="0x00009888" value="0x3B001CC6" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x40800000" />
+        <register type="OA" address="0x000027A0" value="0x00000202" />
+        <register type="OA" address="0x000027A4" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen10"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="eed14f91-5f03-4e3a-8281-ac38030ac573"
+       chipset="CNL"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$EuSubslicesTotalCount $SubsliceMask 1 AND C 2 READ FMUL $SubsliceMask 3 >> 1 AND C 3 READ FMUL FADD FMUL $SubsliceMask 1 AND $SubsliceMask 3 >> 1 AND FADD FDIV 64 UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             availability="$SubsliceMask 9 AND "
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SubsliceMask 1 AND B 5 READ UMUL $SubsliceMask 1 >> 1 AND B 6 READ UMUL UADD $SubsliceMask 2 >> 1 AND B 7 READ UMUL UADD $SubsliceMask 3 >> 1 AND C 0 READ UMUL UADD $SubsliceMask 4 >> 1 AND C 1 READ UMUL UADD 64 UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ A 10 READ A 11 READ FADD A 9 READ FSUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  C 6 READ UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$EuSubslicesTotalCount $SubsliceMask 1 AND C 4 READ FMUL $SubsliceMask 3 >> 1 AND C 5 READ FMUL FADD FMUL $SubsliceMask 1 AND $SubsliceMask 3 >> 1 AND FADD FDIV 64 UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             availability="$SubsliceMask 9 AND"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SubsliceMask 1 AND B 0 READ UMUL $SubsliceMask 1 >> 1 AND B 1 READ UMUL UADD $SubsliceMask 2 >> 1 AND B 2 READ UMUL UADD $SubsliceMask 3 >> 1 AND B 3 READ UMUL UADD $SubsliceMask 4 >> 1 AND B 4 READ UMUL UADD 64 UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 13 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  C 7 READ UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x121A0000" />
+        <register type="NOA" address="0x00009888" value="0x101A0007" />
+        <register type="NOA" address="0x00009888" value="0x123A0000" />
+        <register type="NOA" address="0x00009888" value="0x129A0000" />
+        <register type="NOA" address="0x00009888" value="0x109A0007" />
+        <register type="NOA" address="0x00009888" value="0x12BA0000" />
+        <register type="NOA" address="0x00009888" value="0x125A0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0140" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0005" />
+        <register type="NOA" address="0x00009888" value="0x186C0880" />
+        <register type="NOA" address="0x00009888" value="0x04736000" />
+        <register type="NOA" address="0x00009888" value="0x0673C000" />
+        <register type="NOA" address="0x00009888" value="0x00734000" />
+        <register type="NOA" address="0x00009888" value="0x02731000" />
+        <register type="NOA" address="0x00009888" value="0x0474A000" />
+        <register type="NOA" address="0x00009888" value="0x0E748000" />
+        <register type="NOA" address="0x00009888" value="0x06748000" />
+        <register type="NOA" address="0x00009888" value="0x0475A000" />
+        <register type="NOA" address="0x00009888" value="0x0E758000" />
+        <register type="NOA" address="0x00009888" value="0x06758000" />
+        <register type="NOA" address="0x00009888" value="0x0C762800" />
+        <register type="NOA" address="0x00009888" value="0x10760002" />
+        <register type="NOA" address="0x00009888" value="0x0E760002" />
+        <register type="NOA" address="0x00009888" value="0x0077C000" />
+        <register type="NOA" address="0x00009888" value="0x0E774000" />
+        <register type="NOA" address="0x00009888" value="0x14774000" />
+        <register type="NOA" address="0x00009888" value="0x167797A0" />
+        <register type="NOA" address="0x00009888" value="0x18770002" />
+        <register type="NOA" address="0x00009888" value="0x0277C000" />
+        <register type="NOA" address="0x00009888" value="0x04778000" />
+        <register type="NOA" address="0x00009888" value="0x0677C000" />
+        <register type="NOA" address="0x00009888" value="0x08778000" />
+        <register type="NOA" address="0x00009888" value="0x0A7B0A00" />
+        <register type="NOA" address="0x00009888" value="0x0C7B0028" />
+        <register type="NOA" address="0x00009888" value="0x0E7C8000" />
+        <register type="NOA" address="0x00009888" value="0x147C0C00" />
+        <register type="NOA" address="0x00009888" value="0x167C0038" />
+        <register type="NOA" address="0x00009888" value="0x1C7D2000" />
+        <register type="NOA" address="0x00009888" value="0x1E7D0080" />
+        <register type="NOA" address="0x00009888" value="0x0019C000" />
+        <register type="NOA" address="0x00009888" value="0x1A191800" />
+        <register type="NOA" address="0x00009888" value="0x0219C000" />
+        <register type="NOA" address="0x00009888" value="0x0619C000" />
+        <register type="NOA" address="0x00009888" value="0x001A2E52" />
+        <register type="NOA" address="0x00009888" value="0x0A1A2880" />
+        <register type="NOA" address="0x00009888" value="0x021A2D80" />
+        <register type="NOA" address="0x00009888" value="0x0E39C000" />
+        <register type="NOA" address="0x00009888" value="0x1A396000" />
+        <register type="NOA" address="0x00009888" value="0x063A2900" />
+        <register type="NOA" address="0x00009888" value="0x0C3A0051" />
+        <register type="NOA" address="0x00009888" value="0x003A0000" />
+        <register type="NOA" address="0x00009888" value="0x0CF48000" />
+        <register type="NOA" address="0x00009888" value="0x12F40400" />
+        <register type="NOA" address="0x00009888" value="0x06F42000" />
+        <register type="NOA" address="0x00009888" value="0x08F42000" />
+        <register type="NOA" address="0x00009888" value="0x0CF58000" />
+        <register type="NOA" address="0x00009888" value="0x14F50020" />
+        <register type="NOA" address="0x00009888" value="0x06F52000" />
+        <register type="NOA" address="0x00009888" value="0x08F52000" />
+        <register type="NOA" address="0x00009888" value="0x0EF62008" />
+        <register type="NOA" address="0x00009888" value="0x10F60080" />
+        <register type="NOA" address="0x00009888" value="0x0CF68000" />
+        <register type="NOA" address="0x00009888" value="0x16F7C070" />
+        <register type="NOA" address="0x00009888" value="0x18F70001" />
+        <register type="NOA" address="0x00009888" value="0x04F7C000" />
+        <register type="NOA" address="0x00009888" value="0x08F7C000" />
+        <register type="NOA" address="0x00009888" value="0x0AFB8000" />
+        <register type="NOA" address="0x00009888" value="0x0CFB0200" />
+        <register type="NOA" address="0x00009888" value="0x14FC8000" />
+        <register type="NOA" address="0x00009888" value="0x16FC0200" />
+        <register type="NOA" address="0x00009888" value="0x1EFD2008" />
+        <register type="NOA" address="0x00009888" value="0x1A990180" />
+        <register type="NOA" address="0x00009888" value="0x1C99000C" />
+        <register type="NOA" address="0x00009888" value="0x0499C000" />
+        <register type="NOA" address="0x00009888" value="0x0899C000" />
+        <register type="NOA" address="0x00009888" value="0x089A2900" />
+        <register type="NOA" address="0x00009888" value="0x0E9A0051" />
+        <register type="NOA" address="0x00009888" value="0x029A005C" />
+        <register type="NOA" address="0x00009888" value="0x049A005B" />
+        <register type="NOA" address="0x00009888" value="0x009A0000" />
+        <register type="NOA" address="0x00009888" value="0x1AB90600" />
+        <register type="NOA" address="0x00009888" value="0x1CB90030" />
+        <register type="NOA" address="0x00009888" value="0x0ABA0052" />
+        <register type="NOA" address="0x00009888" value="0x0EBA2880" />
+        <register type="NOA" address="0x00009888" value="0x00BA0000" />
+        <register type="NOA" address="0x00009888" value="0x1A590060" />
+        <register type="NOA" address="0x00009888" value="0x1C590003" />
+        <register type="NOA" address="0x00009888" value="0x085A0052" />
+        <register type="NOA" address="0x00009888" value="0x0C5A2880" />
+        <register type="NOA" address="0x00009888" value="0x005A0000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x1D073800" />
+        <register type="NOA" address="0x00009888" value="0x1F070140" />
+        <register type="NOA" address="0x00009888" value="0x0D048000" />
+        <register type="NOA" address="0x00009888" value="0x0F042000" />
+        <register type="NOA" address="0x00009888" value="0x0507E700" />
+        <register type="NOA" address="0x00009888" value="0x070700D7" />
+        <register type="NOA" address="0x00009888" value="0x25070000" />
+        <register type="NOA" address="0x00009888" value="0x1B070000" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2100C000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2B00C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1300C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x1700C000" />
+        <register type="NOA" address="0x00009888" value="0x1900C000" />
+        <register type="NOA" address="0x00009888" value="0x1B004000" />
+        <register type="NOA" address="0x00009888" value="0x1D004000" />
+        <register type="NOA" address="0x00009888" value="0x47001011" />
+        <register type="NOA" address="0x00009888" value="0x39000021" />
+        <register type="NOA" address="0x00009888" value="0x49001330" />
+        <register type="NOA" address="0x00009888" value="0x3D001026" />
+        <register type="NOA" address="0x00009888" value="0x4B001000" />
+        <register type="NOA" address="0x00009888" value="0x3F000400" />
+        <register type="NOA" address="0x00009888" value="0x4D000001" />
+        <register type="NOA" address="0x00009888" value="0x41000081" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000000" />
+        <register type="NOA" address="0x00009888" value="0x3B001801" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen10"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="0666ccac-f5aa-4dc2-aa12-c6e058f383f3"
+       chipset="CNL"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull stall pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x0A7003E0" />
+        <register type="NOA" address="0x00009888" value="0x0A710000" />
+        <register type="NOA" address="0x00009888" value="0x1017001E" />
+        <register type="NOA" address="0x00009888" value="0x06700015" />
+        <register type="NOA" address="0x00009888" value="0x00700000" />
+        <register type="NOA" address="0x00009888" value="0x06710800" />
+        <register type="NOA" address="0x00009888" value="0x00710000" />
+        <register type="NOA" address="0x00009888" value="0x0C746000" />
+        <register type="NOA" address="0x00009888" value="0x0C75A000" />
+        <register type="NOA" address="0x00009888" value="0x0E754000" />
+        <register type="NOA" address="0x00009888" value="0x0E762800" />
+        <register type="NOA" address="0x00009888" value="0x10760002" />
+        <register type="NOA" address="0x00009888" value="0x1477C000" />
+        <register type="NOA" address="0x00009888" value="0x16770330" />
+        <register type="NOA" address="0x00009888" value="0x1A190040" />
+        <register type="NOA" address="0x00009888" value="0x08170001" />
+        <register type="NOA" address="0x00009888" value="0x1C170000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x01160031" />
+        <register type="NOA" address="0x00009888" value="0x11177C00" />
+        <register type="NOA" address="0x00009888" value="0x11187C00" />
+        <register type="NOA" address="0x00009888" value="0x05190000" />
+        <register type="NOA" address="0x00009888" value="0x110E7800" />
+        <register type="NOA" address="0x00009888" value="0x130F0000" />
+        <register type="NOA" address="0x00009888" value="0x15120000" />
+        <register type="NOA" address="0x00009888" value="0x11130019" />
+        <register type="NOA" address="0x00009888" value="0x0F160C80" />
+        <register type="NOA" address="0x00009888" value="0x0B160000" />
+        <register type="NOA" address="0x00009888" value="0x07162000" />
+        <register type="NOA" address="0x00009888" value="0x03168000" />
+        <register type="NOA" address="0x00009888" value="0x071705C0" />
+        <register type="NOA" address="0x00009888" value="0x011704C0" />
+        <register type="NOA" address="0x00009888" value="0x05170000" />
+        <register type="NOA" address="0x00009888" value="0x0B180015" />
+        <register type="NOA" address="0x00009888" value="0x01185000" />
+        <register type="NOA" address="0x00009888" value="0x07185000" />
+        <register type="NOA" address="0x00009888" value="0x0D185000" />
+        <register type="NOA" address="0x00009888" value="0x0F185000" />
+        <register type="NOA" address="0x00009888" value="0x03186000" />
+        <register type="NOA" address="0x00009888" value="0x05185000" />
+        <register type="NOA" address="0x00009888" value="0x03190022" />
+        <register type="NOA" address="0x00009888" value="0x0F190000" />
+        <register type="NOA" address="0x00009888" value="0x09190000" />
+        <register type="NOA" address="0x00009888" value="0x0D0E8023" />
+        <register type="NOA" address="0x00009888" value="0x030E1100" />
+        <register type="NOA" address="0x00009888" value="0x050E4000" />
+        <register type="NOA" address="0x00009888" value="0x0D0F0180" />
+        <register type="NOA" address="0x00009888" value="0x050F0001" />
+        <register type="NOA" address="0x00009888" value="0x010F0000" />
+        <register type="NOA" address="0x00009888" value="0x1B100054" />
+        <register type="NOA" address="0x00009888" value="0x07104000" />
+        <register type="NOA" address="0x00009888" value="0x09104000" />
+        <register type="NOA" address="0x00009888" value="0x0B104000" />
+        <register type="NOA" address="0x00009888" value="0x0D104000" />
+        <register type="NOA" address="0x00009888" value="0x1B114000" />
+        <register type="NOA" address="0x00009888" value="0x1D110006" />
+        <register type="NOA" address="0x00009888" value="0x07118000" />
+        <register type="NOA" address="0x00009888" value="0x09118000" />
+        <register type="NOA" address="0x00009888" value="0x0B114000" />
+        <register type="NOA" address="0x00009888" value="0x0D114000" />
+        <register type="NOA" address="0x00009888" value="0x05127100" />
+        <register type="NOA" address="0x00009888" value="0x07120073" />
+        <register type="NOA" address="0x00009888" value="0x21120001" />
+        <register type="NOA" address="0x00009888" value="0x1F120000" />
+        <register type="NOA" address="0x00009888" value="0x0F130002" />
+        <register type="NOA" address="0x00009888" value="0x01130000" />
+        <register type="NOA" address="0x00009888" value="0x0B144000" />
+        <register type="NOA" address="0x00009888" value="0x0F144025" />
+        <register type="NOA" address="0x00009888" value="0x11140025" />
+        <register type="NOA" address="0x00009888" value="0x0D145200" />
+        <register type="NOA" address="0x00009888" value="0x11158000" />
+        <register type="NOA" address="0x00009888" value="0x1F158080" />
+        <register type="NOA" address="0x00009888" value="0x13158000" />
+        <register type="NOA" address="0x00009888" value="0x0109A000" />
+        <register type="NOA" address="0x00009888" value="0x0709A000" />
+        <register type="NOA" address="0x00009888" value="0x0B092000" />
+        <register type="NOA" address="0x00009888" value="0x0D09A000" />
+        <register type="NOA" address="0x00009888" value="0x0F09A000" />
+        <register type="NOA" address="0x00009888" value="0x0309A000" />
+        <register type="NOA" address="0x00009888" value="0x0509A000" />
+        <register type="NOA" address="0x00009888" value="0x010BC000" />
+        <register type="NOA" address="0x00009888" value="0x070BC000" />
+        <register type="NOA" address="0x00009888" value="0x0B0B4000" />
+        <register type="NOA" address="0x00009888" value="0x0D0BC000" />
+        <register type="NOA" address="0x00009888" value="0x0F0BC000" />
+        <register type="NOA" address="0x00009888" value="0x030BC000" />
+        <register type="NOA" address="0x00009888" value="0x050BC000" />
+        <register type="NOA" address="0x00009888" value="0x09045000" />
+        <register type="NOA" address="0x00009888" value="0x0F045000" />
+        <register type="NOA" address="0x00009888" value="0x11044000" />
+        <register type="NOA" address="0x00009888" value="0x13040154" />
+        <register type="NOA" address="0x00009888" value="0x0B045000" />
+        <register type="NOA" address="0x00009888" value="0x0D045000" />
+        <register type="NOA" address="0x00009888" value="0x11004000" />
+        <register type="NOA" address="0x00009888" value="0x1F004000" />
+        <register type="NOA" address="0x00009888" value="0x2100C000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x25004000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x29004000" />
+        <register type="NOA" address="0x00009888" value="0x2B004000" />
+        <register type="NOA" address="0x00009888" value="0x2D004000" />
+        <register type="NOA" address="0x00009888" value="0x2F004000" />
+        <register type="NOA" address="0x00009888" value="0x13004000" />
+        <register type="NOA" address="0x00009888" value="0x15004000" />
+        <register type="NOA" address="0x00009888" value="0x17004000" />
+        <register type="NOA" address="0x00009888" value="0x19004000" />
+        <register type="NOA" address="0x00009888" value="0x1B004000" />
+        <register type="NOA" address="0x00009888" value="0x1D004000" />
+        <register type="NOA" address="0x00009888" value="0x47001111" />
+        <register type="NOA" address="0x00009888" value="0x39001022" />
+        <register type="NOA" address="0x00009888" value="0x49001111" />
+        <register type="NOA" address="0x00009888" value="0x3D000021" />
+        <register type="NOA" address="0x00009888" value="0x4B000100" />
+        <register type="NOA" address="0x00009888" value="0x3F0018A5" />
+        <register type="NOA" address="0x00009888" value="0x4D001111" />
+        <register type="NOA" address="0x00009888" value="0x41000001" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000002" />
+        <register type="NOA" address="0x00009888" value="0x3B000401" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen10"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="3500dcfd-837b-4ec8-b5cf-fe58b966263f"
+       chipset="CNL"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads UADD $GtiL3Bank2Reads UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x17066860" />
+        <register type="NOA" address="0x00009888" value="0x15070017" />
+        <register type="NOA" address="0x00009888" value="0x1F072920" />
+        <register type="NOA" address="0x00009888" value="0x1B038000" />
+        <register type="NOA" address="0x00009888" value="0x0D038000" />
+        <register type="NOA" address="0x00009888" value="0x0F034000" />
+        <register type="NOA" address="0x00009888" value="0x0F063180" />
+        <register type="NOA" address="0x00009888" value="0x01063100" />
+        <register type="NOA" address="0x00009888" value="0x0306006B" />
+        <register type="NOA" address="0x00009888" value="0x05060000" />
+        <register type="NOA" address="0x00009888" value="0x11080100" />
+        <register type="NOA" address="0x00009888" value="0x0D085000" />
+        <register type="NOA" address="0x00009888" value="0x0F094000" />
+        <register type="NOA" address="0x00009888" value="0x01094000" />
+        <register type="NOA" address="0x00009888" value="0x03091000" />
+        <register type="NOA" address="0x00009888" value="0x09046000" />
+        <register type="NOA" address="0x00009888" value="0x0F04A000" />
+        <register type="NOA" address="0x00009888" value="0x1104A800" />
+        <register type="NOA" address="0x00009888" value="0x130401AA" />
+        <register type="NOA" address="0x00009888" value="0x0B041000" />
+        <register type="NOA" address="0x00009888" value="0x010700E0" />
+        <register type="NOA" address="0x00009888" value="0x0707E153" />
+        <register type="NOA" address="0x00009888" value="0x0907E3E2" />
+        <register type="NOA" address="0x00009888" value="0x0B07E5E4" />
+        <register type="NOA" address="0x00009888" value="0x0D07E7E6" />
+        <register type="NOA" address="0x00009888" value="0x0F0700EF" />
+        <register type="NOA" address="0x00009888" value="0x25070000" />
+        <register type="NOA" address="0x00009888" value="0x11070000" />
+        <register type="NOA" address="0x00009888" value="0x23070000" />
+        <register type="NOA" address="0x00009888" value="0x1D070000" />
+        <register type="NOA" address="0x00009888" value="0x11004000" />
+        <register type="NOA" address="0x00009888" value="0x1F004000" />
+        <register type="NOA" address="0x00009888" value="0x21004000" />
+        <register type="NOA" address="0x00009888" value="0x23004000" />
+        <register type="NOA" address="0x00009888" value="0x25004000" />
+        <register type="NOA" address="0x00009888" value="0x27004000" />
+        <register type="NOA" address="0x00009888" value="0x29004000" />
+        <register type="NOA" address="0x00009888" value="0x2B004000" />
+        <register type="NOA" address="0x00009888" value="0x2D004000" />
+        <register type="NOA" address="0x00009888" value="0x2F004000" />
+        <register type="NOA" address="0x00009888" value="0x13004000" />
+        <register type="NOA" address="0x00009888" value="0x15004000" />
+        <register type="NOA" address="0x00009888" value="0x1D004000" />
+        <register type="NOA" address="0x00009888" value="0x47000000" />
+        <register type="NOA" address="0x00009888" value="0x39000003" />
+        <register type="NOA" address="0x00009888" value="0x49000000" />
+        <register type="NOA" address="0x00009888" value="0x3D000C63" />
+        <register type="NOA" address="0x00009888" value="0x4B000000" />
+        <register type="NOA" address="0x00009888" value="0x3F000C63" />
+        <register type="NOA" address="0x00009888" value="0x4D000000" />
+        <register type="NOA" address="0x00009888" value="0x41000C63" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x0000081A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0000082A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x00000872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x000008BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0000087A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x000008EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x000008E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x000008F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00000065" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen10"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="63d18ead-3cfc-4972-a640-5e98b688dfee"
+       chipset="CNL"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes UADD $GtiL3Bank2Writes UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x17066860" />
+        <register type="NOA" address="0x00009888" value="0x15070017" />
+        <register type="NOA" address="0x00009888" value="0x1D073C00" />
+        <register type="NOA" address="0x00009888" value="0x1F07000E" />
+        <register type="NOA" address="0x00009888" value="0x1B038000" />
+        <register type="NOA" address="0x00009888" value="0x0D038000" />
+        <register type="NOA" address="0x00009888" value="0x0F034000" />
+        <register type="NOA" address="0x00009888" value="0x0F063180" />
+        <register type="NOA" address="0x00009888" value="0x01063100" />
+        <register type="NOA" address="0x00009888" value="0x0306006B" />
+        <register type="NOA" address="0x00009888" value="0x05060000" />
+        <register type="NOA" address="0x00009888" value="0x11080100" />
+        <register type="NOA" address="0x00009888" value="0x0D085000" />
+        <register type="NOA" address="0x00009888" value="0x0F094000" />
+        <register type="NOA" address="0x00009888" value="0x01094000" />
+        <register type="NOA" address="0x00009888" value="0x03091000" />
+        <register type="NOA" address="0x00009888" value="0x09046000" />
+        <register type="NOA" address="0x00009888" value="0x0F04A000" />
+        <register type="NOA" address="0x00009888" value="0x1104A800" />
+        <register type="NOA" address="0x00009888" value="0x130401AA" />
+        <register type="NOA" address="0x00009888" value="0x0B041000" />
+        <register type="NOA" address="0x00009888" value="0x010700D0" />
+        <register type="NOA" address="0x00009888" value="0x0707D153" />
+        <register type="NOA" address="0x00009888" value="0x0907D3D2" />
+        <register type="NOA" address="0x00009888" value="0x0B07D5D4" />
+        <register type="NOA" address="0x00009888" value="0x0D07D7D6" />
+        <register type="NOA" address="0x00009888" value="0x0F0700DF" />
+        <register type="NOA" address="0x00009888" value="0x25070000" />
+        <register type="NOA" address="0x00009888" value="0x11070000" />
+        <register type="NOA" address="0x00009888" value="0x23070000" />
+        <register type="NOA" address="0x00009888" value="0x11004000" />
+        <register type="NOA" address="0x00009888" value="0x1F004000" />
+        <register type="NOA" address="0x00009888" value="0x21004000" />
+        <register type="NOA" address="0x00009888" value="0x23004000" />
+        <register type="NOA" address="0x00009888" value="0x25004000" />
+        <register type="NOA" address="0x00009888" value="0x27004000" />
+        <register type="NOA" address="0x00009888" value="0x29004000" />
+        <register type="NOA" address="0x00009888" value="0x2B004000" />
+        <register type="NOA" address="0x00009888" value="0x2D004000" />
+        <register type="NOA" address="0x00009888" value="0x2F004000" />
+        <register type="NOA" address="0x00009888" value="0x13004000" />
+        <register type="NOA" address="0x00009888" value="0x15004000" />
+        <register type="NOA" address="0x00009888" value="0x1D004000" />
+        <register type="NOA" address="0x00009888" value="0x47000000" />
+        <register type="NOA" address="0x00009888" value="0x39000003" />
+        <register type="NOA" address="0x00009888" value="0x49000000" />
+        <register type="NOA" address="0x00009888" value="0x3D000C63" />
+        <register type="NOA" address="0x00009888" value="0x4B000000" />
+        <register type="NOA" address="0x00009888" value="0x3F000C63" />
+        <register type="NOA" address="0x00009888" value="0x4D000000" />
+        <register type="NOA" address="0x00009888" value="0x41000C63" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x70800000" />
+        <register type="OA" address="0x00002770" value="0x0000081A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x00000822" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x000008BA" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0000087A" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x000008EA" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x000008E2" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x000008F2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x0000274C" value="0x65432108" />
+        <register type="OA" address="0x00002744" value="0x0000CCCE" />
+        <register type="OA" address="0x00002748" value="0x65432108" />
+        <register type="OA" address="0x0000275C" value="0x65432108" />
+        <register type="OA" address="0x00002754" value="0x000000CA" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen10"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="1b4d1280-6bbd-4d57-90c6-a03ed6059688"
+       chipset="CNL"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ A 10 READ A 11 READ FADD A 9 READ FSUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 FADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 13 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 FADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA"
+                     availability="$SubsliceMask 1 AND"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x121A0007" />
+        <register type="NOA" address="0x00009888" value="0x101A0000" />
+        <register type="NOA" address="0x00009888" value="0x121B000B" />
+        <register type="NOA" address="0x00009888" value="0x161B0009" />
+        <register type="NOA" address="0x00009888" value="0x0474A000" />
+        <register type="NOA" address="0x00009888" value="0x0A748000" />
+        <register type="NOA" address="0x00009888" value="0x0C74A000" />
+        <register type="NOA" address="0x00009888" value="0x0E74A000" />
+        <register type="NOA" address="0x00009888" value="0x12741540" />
+        <register type="NOA" address="0x00009888" value="0x0674A000" />
+        <register type="NOA" address="0x00009888" value="0x08742000" />
+        <register type="NOA" address="0x00009888" value="0x0475A000" />
+        <register type="NOA" address="0x00009888" value="0x0A758000" />
+        <register type="NOA" address="0x00009888" value="0x0C75A000" />
+        <register type="NOA" address="0x00009888" value="0x0E75A000" />
+        <register type="NOA" address="0x00009888" value="0x147500AA" />
+        <register type="NOA" address="0x00009888" value="0x0675A000" />
+        <register type="NOA" address="0x00009888" value="0x08752000" />
+        <register type="NOA" address="0x00009888" value="0x0C76A800" />
+        <register type="NOA" address="0x00009888" value="0x0E76AA0A" />
+        <register type="NOA" address="0x00009888" value="0x107602AA" />
+        <register type="NOA" address="0x00009888" value="0x0077C000" />
+        <register type="NOA" address="0x00009888" value="0x0E77C000" />
+        <register type="NOA" address="0x00009888" value="0x1477C000" />
+        <register type="NOA" address="0x00009888" value="0x1677FFF0" />
+        <register type="NOA" address="0x00009888" value="0x18770003" />
+        <register type="NOA" address="0x00009888" value="0x0277C000" />
+        <register type="NOA" address="0x00009888" value="0x0477C000" />
+        <register type="NOA" address="0x00009888" value="0x0677C000" />
+        <register type="NOA" address="0x00009888" value="0x0877C000" />
+        <register type="NOA" address="0x00009888" value="0x00198000" />
+        <register type="NOA" address="0x00009888" value="0x0E198000" />
+        <register type="NOA" address="0x00009888" value="0x1A195540" />
+        <register type="NOA" address="0x00009888" value="0x1C19003A" />
+        <register type="NOA" address="0x00009888" value="0x0219C000" />
+        <register type="NOA" address="0x00009888" value="0x0419C000" />
+        <register type="NOA" address="0x00009888" value="0x0619C000" />
+        <register type="NOA" address="0x00009888" value="0x0819C000" />
+        <register type="NOA" address="0x00009888" value="0x0E1A2A00" />
+        <register type="NOA" address="0x00009888" value="0x001A2980" />
+        <register type="NOA" address="0x00009888" value="0x021A2CDA" />
+        <register type="NOA" address="0x00009888" value="0x041A0058" />
+        <register type="NOA" address="0x00009888" value="0x001B0011" />
+        <register type="NOA" address="0x00009888" value="0x061B0900" />
+        <register type="NOA" address="0x00009888" value="0x081B0A13" />
+        <register type="NOA" address="0x00009888" value="0x0A1B0B15" />
+        <register type="NOA" address="0x00009888" value="0x0C1B2317" />
+        <register type="NOA" address="0x00009888" value="0x0E1B0043" />
+        <register type="NOA" address="0x00009888" value="0x101B0000" />
+        <register type="NOA" address="0x00009888" value="0x10178000" />
+        <register type="NOA" address="0x00009888" value="0x1C1701FE" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2100C000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2B00C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1300C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x1700C000" />
+        <register type="NOA" address="0x00009888" value="0x1900C000" />
+        <register type="NOA" address="0x00009888" value="0x47000000" />
+        <register type="NOA" address="0x00009888" value="0x39000420" />
+        <register type="NOA" address="0x00009888" value="0x49000000" />
+        <register type="NOA" address="0x00009888" value="0x3D000000" />
+        <register type="NOA" address="0x00009888" value="0x4B000000" />
+        <register type="NOA" address="0x00009888" value="0x3F000000" />
+        <register type="NOA" address="0x00009888" value="0x4D000000" />
+        <register type="NOA" address="0x00009888" value="0x41000000" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000001" />
+        <register type="NOA" address="0x00009888" value="0x3B000021" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00000C2A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x00000C6A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x00000C32" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x00000E6A" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x00000E7A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x00000C92" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x00000CA2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x00000C9A" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen10"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="f3b31b5a-00b3-4fb4-81fd-6446e505534c"
+       chipset="CNL"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 2 READ C 3 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank0."
+             data_type="uint64"
+             equation="B 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank1 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank1."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank2 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank2."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice1 L3 Bank0 Accesses"
+             description="The total number of accesses to Slice1 L3 Bank0."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank10_accesses"
+             units="messages"
+             symbol_name="L3Bank10Accesses"
+             availability="$SliceMask 2 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice1 L3 Bank1 Accesses"
+             description="The total number of accesses to Slice1 L3 Bank1."
+             data_type="uint64"
+             equation="B 4 READ 2 UMUL"
+             underscore_name="l3_bank11_accesses"
+             units="messages"
+             symbol_name="L3Bank11Accesses"
+             availability="$SliceMask 2 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice1 L3 Bank2 Accesses"
+             description="The total number of accesses to Slice1 L3 Bank2."
+             data_type="uint64"
+             equation="B 5 READ 2 UMUL"
+             underscore_name="l3_bank12_accesses"
+             units="messages"
+             symbol_name="L3Bank12Accesses"
+             availability="$SliceMask 2 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="$L3Bank00Accesses $L3Bank01Accesses UADD $L3Bank02Accesses UADD $L3Bank10Accesses UADD $L3Bank11Accesses UADD $L3Bank12Accesses UADD"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="64  $SliceMask 1 AND C 4 READ UMUL $SliceMask 1 >> 1 AND C 5 READ UMUL UADD 8 UMUL UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ A 10 READ A 11 READ FADD A 9 READ FSUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages send to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="$SamplerAccesses 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SliceMask 1 AND C 4 READ UMUL $SliceMask 1 >> 1 AND C 5 READ UMUL UADD 8 UMUL A 32 READ UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  C 6 READ UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  C 7 READ UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x146C0080" />
+        <register type="NOA" address="0x00009888" value="0x14EC0080" />
+        <register type="NOA" address="0x00009888" value="0x006C0050" />
+        <register type="NOA" address="0x00009888" value="0x066C5100" />
+        <register type="NOA" address="0x00009888" value="0x086C0052" />
+        <register type="NOA" address="0x00009888" value="0x026C5C00" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x186C0800" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0540" />
+        <register type="NOA" address="0x00009888" value="0x00739000" />
+        <register type="NOA" address="0x00009888" value="0x02739000" />
+        <register type="NOA" address="0x00009888" value="0x0473F000" />
+        <register type="NOA" address="0x00009888" value="0x00778000" />
+        <register type="NOA" address="0x00009888" value="0x0E778000" />
+        <register type="NOA" address="0x00009888" value="0x14778000" />
+        <register type="NOA" address="0x00009888" value="0x167702A0" />
+        <register type="NOA" address="0x00009888" value="0x06778000" />
+        <register type="NOA" address="0x00009888" value="0x08778000" />
+        <register type="NOA" address="0x00009888" value="0x08EC5000" />
+        <register type="NOA" address="0x00009888" value="0x0AEC5251" />
+        <register type="NOA" address="0x00009888" value="0x04EC005C" />
+        <register type="NOA" address="0x00009888" value="0x10EC0000" />
+        <register type="NOA" address="0x00009888" value="0x1AEC0000" />
+        <register type="NOA" address="0x00009888" value="0x18EC0000" />
+        <register type="NOA" address="0x00009888" value="0x04F3E000" />
+        <register type="NOA" address="0x00009888" value="0x02F31000" />
+        <register type="NOA" address="0x00009888" value="0x16F702A0" />
+        <register type="NOA" address="0x00009888" value="0x08F78000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x0B080360" />
+        <register type="NOA" address="0x00009888" value="0x1D073800" />
+        <register type="NOA" address="0x00009888" value="0x1F070140" />
+        <register type="NOA" address="0x00009888" value="0x01081060" />
+        <register type="NOA" address="0x00009888" value="0x0D080000" />
+        <register type="NOA" address="0x00009888" value="0x01094000" />
+        <register type="NOA" address="0x00009888" value="0x03091000" />
+        <register type="NOA" address="0x00009888" value="0x09044000" />
+        <register type="NOA" address="0x00009888" value="0x0B041000" />
+        <register type="NOA" address="0x00009888" value="0x0D048000" />
+        <register type="NOA" address="0x00009888" value="0x0F042000" />
+        <register type="NOA" address="0x00009888" value="0x0507E700" />
+        <register type="NOA" address="0x00009888" value="0x070700D7" />
+        <register type="NOA" address="0x00009888" value="0x25070000" />
+        <register type="NOA" address="0x00009888" value="0x1B070000" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2100C000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x13004000" />
+        <register type="NOA" address="0x00009888" value="0x15004000" />
+        <register type="NOA" address="0x00009888" value="0x1700C000" />
+        <register type="NOA" address="0x00009888" value="0x1900C000" />
+        <register type="NOA" address="0x00009888" value="0x1B004000" />
+        <register type="NOA" address="0x00009888" value="0x1D004000" />
+        <register type="NOA" address="0x00009888" value="0x47001111" />
+        <register type="NOA" address="0x00009888" value="0x39002101" />
+        <register type="NOA" address="0x00009888" value="0x49001110" />
+        <register type="NOA" address="0x00009888" value="0x3D000429" />
+        <register type="NOA" address="0x00009888" value="0x4B000001" />
+        <register type="NOA" address="0x00009888" value="0x3F000000" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x3B002401" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="890094c5-8615-4f69-a8b9-706c5bcbd713"
+       chipset="CNL"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="Slice0 Subslice1 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Subslice1)"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ B 5 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Subslice2 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Subslice2)"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ B 7 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Subslice0 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice1 Subslice0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ C 1 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader10_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader10AccessStalledOnL3"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Slice1 Subslice1 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice1 Subslice1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ C 3 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader11_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader11AccessStalledOnL3"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 Subslice0 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Subslice0)"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ B 3 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x121A0011" />
+        <register type="NOA" address="0x00009888" value="0x123A0011" />
+        <register type="NOA" address="0x00009888" value="0x129A0011" />
+        <register type="NOA" address="0x00009888" value="0x12BA0011" />
+        <register type="NOA" address="0x00009888" value="0x125A0011" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0005" />
+        <register type="NOA" address="0x00009888" value="0x186C00A0" />
+        <register type="NOA" address="0x00009888" value="0x0673C000" />
+        <register type="NOA" address="0x00009888" value="0x00736000" />
+        <register type="NOA" address="0x00009888" value="0x0C74A000" />
+        <register type="NOA" address="0x00009888" value="0x0C75A000" />
+        <register type="NOA" address="0x00009888" value="0x0E762800" />
+        <register type="NOA" address="0x00009888" value="0x1477C000" />
+        <register type="NOA" address="0x00009888" value="0x16779570" />
+        <register type="NOA" address="0x00009888" value="0x18770002" />
+        <register type="NOA" address="0x00009888" value="0x02778000" />
+        <register type="NOA" address="0x00009888" value="0x04778000" />
+        <register type="NOA" address="0x00009888" value="0x0A7B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C7B002A" />
+        <register type="NOA" address="0x00009888" value="0x147C8000" />
+        <register type="NOA" address="0x00009888" value="0x167C003E" />
+        <register type="NOA" address="0x00009888" value="0x1E7D0028" />
+        <register type="NOA" address="0x00009888" value="0x1A1901E0" />
+        <register type="NOA" address="0x00009888" value="0x081A2B50" />
+        <register type="NOA" address="0x00009888" value="0x001A0000" />
+        <register type="NOA" address="0x00009888" value="0x1A391E00" />
+        <register type="NOA" address="0x00009888" value="0x0A3A2B50" />
+        <register type="NOA" address="0x00009888" value="0x003A0000" />
+        <register type="NOA" address="0x00009888" value="0x12F41400" />
+        <register type="NOA" address="0x00009888" value="0x14F500A0" />
+        <register type="NOA" address="0x00009888" value="0x10F60280" />
+        <register type="NOA" address="0x00009888" value="0x16F7C000" />
+        <register type="NOA" address="0x00009888" value="0x18F70003" />
+        <register type="NOA" address="0x00009888" value="0x02F74000" />
+        <register type="NOA" address="0x00009888" value="0x04F74000" />
+        <register type="NOA" address="0x00009888" value="0x08FBA000" />
+        <register type="NOA" address="0x00009888" value="0x02FC8000" />
+        <register type="NOA" address="0x00009888" value="0x04FC8000" />
+        <register type="NOA" address="0x00009888" value="0x1CFD000A" />
+        <register type="NOA" address="0x00009888" value="0x1C99003C" />
+        <register type="NOA" address="0x00009888" value="0x0E9A2B50" />
+        <register type="NOA" address="0x00009888" value="0x009A0000" />
+        <register type="NOA" address="0x00009888" value="0x02B9C000" />
+        <register type="NOA" address="0x00009888" value="0x04B9C000" />
+        <register type="NOA" address="0x00009888" value="0x00BA2800" />
+        <register type="NOA" address="0x00009888" value="0x02BA0056" />
+        <register type="NOA" address="0x00009888" value="0x1A596000" />
+        <register type="NOA" address="0x00009888" value="0x1C590003" />
+        <register type="NOA" address="0x00009888" value="0x0C5A2B50" />
+        <register type="NOA" address="0x00009888" value="0x005A0000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x130E03C0" />
+        <register type="NOA" address="0x00009888" value="0x2100F000" />
+        <register type="NOA" address="0x00009888" value="0x01181000" />
+        <register type="NOA" address="0x00009888" value="0x010E0030" />
+        <register type="NOA" address="0x00009888" value="0x110E0000" />
+        <register type="NOA" address="0x00009888" value="0x01104000" />
+        <register type="NOA" address="0x00009888" value="0x01118000" />
+        <register type="NOA" address="0x00009888" value="0x0B142000" />
+        <register type="NOA" address="0x00009888" value="0x01092000" />
+        <register type="NOA" address="0x00009888" value="0x010B4000" />
+        <register type="NOA" address="0x00009888" value="0x09041000" />
+        <register type="NOA" address="0x00009888" value="0x1D000071" />
+        <register type="NOA" address="0x00009888" value="0x33000000" />
+        <register type="NOA" address="0x00009888" value="0x11004000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2B00C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1300C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x47000003" />
+        <register type="NOA" address="0x00009888" value="0x39000000" />
+        <register type="NOA" address="0x00009888" value="0x4B001111" />
+        <register type="NOA" address="0x00009888" value="0x3D000408" />
+        <register type="NOA" address="0x00009888" value="0x3F000421" />
+        <register type="NOA" address="0x00009888" value="0x4D000000" />
+        <register type="NOA" address="0x00009888" value="0x41000084" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000000" />
+        <register type="NOA" address="0x00009888" value="0x49000300" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FFFE" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="e56f7dd7-ff55-4bae-89a1-a526a2e3b0d6"
+       chipset="CNL"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice1 L3 Bank2 Stalled"
+             description="The percentage of time in which slice1 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank2_stalled"
+             units="percent"
+             symbol_name="L31Bank2Stalled"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x1661001A" />
+        <register type="NOA" address="0x00009888" value="0x1665001A" />
+        <register type="NOA" address="0x00009888" value="0x1669001A" />
+        <register type="NOA" address="0x00009888" value="0x106C1C00" />
+        <register type="NOA" address="0x00009888" value="0x126C0004" />
+        <register type="NOA" address="0x00009888" value="0x166C001D" />
+        <register type="NOA" address="0x00009888" value="0x10EC0400" />
+        <register type="NOA" address="0x00009888" value="0x16EC0000" />
+        <register type="NOA" address="0x00009888" value="0x02610024" />
+        <register type="NOA" address="0x00009888" value="0x10610000" />
+        <register type="NOA" address="0x00009888" value="0x1E610000" />
+        <register type="NOA" address="0x00009888" value="0x02652400" />
+        <register type="NOA" address="0x00009888" value="0x10650000" />
+        <register type="NOA" address="0x00009888" value="0x1E650000" />
+        <register type="NOA" address="0x00009888" value="0x04690024" />
+        <register type="NOA" address="0x00009888" value="0x10690000" />
+        <register type="NOA" address="0x00009888" value="0x1E690000" />
+        <register type="NOA" address="0x00009888" value="0x006C0020" />
+        <register type="NOA" address="0x00009888" value="0x066C2800" />
+        <register type="NOA" address="0x00009888" value="0x0A6C2820" />
+        <register type="NOA" address="0x00009888" value="0x0E6C3832" />
+        <register type="NOA" address="0x00009888" value="0x186C05A0" />
+        <register type="NOA" address="0x00009888" value="0x1A6C1010" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x186D8000" />
+        <register type="NOA" address="0x00009888" value="0x0A6E1000" />
+        <register type="NOA" address="0x00009888" value="0x0073F000" />
+        <register type="NOA" address="0x00009888" value="0x02738000" />
+        <register type="NOA" address="0x00009888" value="0x0473D000" />
+        <register type="NOA" address="0x00009888" value="0x0673D000" />
+        <register type="NOA" address="0x00009888" value="0x00778000" />
+        <register type="NOA" address="0x00009888" value="0x0E778000" />
+        <register type="NOA" address="0x00009888" value="0x14778000" />
+        <register type="NOA" address="0x00009888" value="0x16778A80" />
+        <register type="NOA" address="0x00009888" value="0x18770002" />
+        <register type="NOA" address="0x00009888" value="0x02778000" />
+        <register type="NOA" address="0x00009888" value="0x04778000" />
+        <register type="NOA" address="0x00009888" value="0x06778000" />
+        <register type="NOA" address="0x00009888" value="0x08774000" />
+        <register type="NOA" address="0x00009888" value="0x04784000" />
+        <register type="NOA" address="0x00009888" value="0x0A7B0004" />
+        <register type="NOA" address="0x00009888" value="0x08EC0020" />
+        <register type="NOA" address="0x00009888" value="0x0CEC0020" />
+        <register type="NOA" address="0x00009888" value="0x00EC3600" />
+        <register type="NOA" address="0x00009888" value="0x1AEC0000" />
+        <register type="NOA" address="0x00009888" value="0x18EC0000" />
+        <register type="NOA" address="0x00009888" value="0x04F31000" />
+        <register type="NOA" address="0x00009888" value="0x06F31000" />
+        <register type="NOA" address="0x00009888" value="0x00F32000" />
+        <register type="NOA" address="0x00009888" value="0x14F78000" />
+        <register type="NOA" address="0x00009888" value="0x16F70800" />
+        <register type="NOA" address="0x00009888" value="0x02F78000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x2100F000" />
+        <register type="NOA" address="0x00009888" value="0x1D000071" />
+        <register type="NOA" address="0x00009888" value="0x33000000" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1300C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x1700C000" />
+        <register type="NOA" address="0x00009888" value="0x1900C000" />
+        <register type="NOA" address="0x00009888" value="0x47000101" />
+        <register type="NOA" address="0x00009888" value="0x39000001" />
+        <register type="NOA" address="0x00009888" value="0x49001300" />
+        <register type="NOA" address="0x00009888" value="0x3D000021" />
+        <register type="NOA" address="0x00009888" value="0x4B001100" />
+        <register type="NOA" address="0x00009888" value="0x3F000420" />
+        <register type="NOA" address="0x00009888" value="0x4D001100" />
+        <register type="NOA" address="0x00009888" value="0x41000400" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000001" />
+        <register type="NOA" address="0x00009888" value="0x3B0000C7" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x20000801" />
+        <register type="OA" address="0x00002774" value="0x0111FEEE" />
+        <register type="OA" address="0x00002778" value="0x40001001" />
+        <register type="OA" address="0x0000277C" value="0x0222FDDD" />
+        <register type="OA" address="0x00002780" value="0x80002002" />
+        <register type="OA" address="0x00002784" value="0x0444FBBB" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="918834e2-a1a4-4d77-9f3a-0c229f8d803f"
+       chipset="CNL"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank1 Stalled"
+             description="The percentage of time in which slice1 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank1_stalled"
+             units="percent"
+             symbol_name="L31Bank1Stalled"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice1 L3 Bank0 Stalled"
+             description="The percentage of time in which slice1 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank0_stalled"
+             units="percent"
+             symbol_name="L31Bank0Stalled"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank2 Active"
+             description="The percentage of time in which slice1 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank2_active"
+             units="percent"
+             symbol_name="L31Bank2Active"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice1 L3 Bank1 Active"
+             description="The percentage of time in which slice1 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank1_active"
+             units="percent"
+             symbol_name="L31Bank1Active"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 L3 Bank0 Active"
+             description="The percentage of time in which slice1 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l31_bank0_active"
+             units="percent"
+             symbol_name="L31Bank0Active"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x106C0400" />
+        <register type="NOA" address="0x00009888" value="0x166C0000" />
+        <register type="NOA" address="0x00009888" value="0x16E1001A" />
+        <register type="NOA" address="0x00009888" value="0x16E5001A" />
+        <register type="NOA" address="0x00009888" value="0x16E9001A" />
+        <register type="NOA" address="0x00009888" value="0x10EC1C00" />
+        <register type="NOA" address="0x00009888" value="0x12EC0004" />
+        <register type="NOA" address="0x00009888" value="0x16EC001D" />
+        <register type="NOA" address="0x00009888" value="0x086C0020" />
+        <register type="NOA" address="0x00009888" value="0x0C6C0020" />
+        <register type="NOA" address="0x00009888" value="0x006C3600" />
+        <register type="NOA" address="0x00009888" value="0x186C0A88" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0504" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0005" />
+        <register type="NOA" address="0x00009888" value="0x0073F000" />
+        <register type="NOA" address="0x00009888" value="0x02739000" />
+        <register type="NOA" address="0x00009888" value="0x0473D000" />
+        <register type="NOA" address="0x00009888" value="0x0673D000" />
+        <register type="NOA" address="0x00009888" value="0x00778000" />
+        <register type="NOA" address="0x00009888" value="0x0E778000" />
+        <register type="NOA" address="0x00009888" value="0x14778000" />
+        <register type="NOA" address="0x00009888" value="0x16778A80" />
+        <register type="NOA" address="0x00009888" value="0x18770002" />
+        <register type="NOA" address="0x00009888" value="0x02778000" />
+        <register type="NOA" address="0x00009888" value="0x04778000" />
+        <register type="NOA" address="0x00009888" value="0x06778000" />
+        <register type="NOA" address="0x00009888" value="0x08778000" />
+        <register type="NOA" address="0x00009888" value="0x02E10024" />
+        <register type="NOA" address="0x00009888" value="0x10E10000" />
+        <register type="NOA" address="0x00009888" value="0x1EE10000" />
+        <register type="NOA" address="0x00009888" value="0x02E52400" />
+        <register type="NOA" address="0x00009888" value="0x10E50000" />
+        <register type="NOA" address="0x00009888" value="0x1EE50000" />
+        <register type="NOA" address="0x00009888" value="0x04E90024" />
+        <register type="NOA" address="0x00009888" value="0x10E90000" />
+        <register type="NOA" address="0x00009888" value="0x1EE90000" />
+        <register type="NOA" address="0x00009888" value="0x00EC0020" />
+        <register type="NOA" address="0x00009888" value="0x06EC2800" />
+        <register type="NOA" address="0x00009888" value="0x0AEC2820" />
+        <register type="NOA" address="0x00009888" value="0x0EEC3832" />
+        <register type="NOA" address="0x00009888" value="0x18EC0580" />
+        <register type="NOA" address="0x00009888" value="0x1AEC0000" />
+        <register type="NOA" address="0x00009888" value="0x1CEC0000" />
+        <register type="NOA" address="0x00009888" value="0x18ED8000" />
+        <register type="NOA" address="0x00009888" value="0x0AEE1000" />
+        <register type="NOA" address="0x00009888" value="0x00F3D000" />
+        <register type="NOA" address="0x00009888" value="0x02F38000" />
+        <register type="NOA" address="0x00009888" value="0x04F3C000" />
+        <register type="NOA" address="0x00009888" value="0x06F3C000" />
+        <register type="NOA" address="0x00009888" value="0x00F78000" />
+        <register type="NOA" address="0x00009888" value="0x0EF78000" />
+        <register type="NOA" address="0x00009888" value="0x16F78280" />
+        <register type="NOA" address="0x00009888" value="0x18F70002" />
+        <register type="NOA" address="0x00009888" value="0x04F78000" />
+        <register type="NOA" address="0x00009888" value="0x06F78000" />
+        <register type="NOA" address="0x00009888" value="0x08F74000" />
+        <register type="NOA" address="0x00009888" value="0x04F84000" />
+        <register type="NOA" address="0x00009888" value="0x0AFB0004" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x2100F000" />
+        <register type="NOA" address="0x00009888" value="0x1D000071" />
+        <register type="NOA" address="0x00009888" value="0x33000000" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1300C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x1700C000" />
+        <register type="NOA" address="0x00009888" value="0x1900C000" />
+        <register type="NOA" address="0x00009888" value="0x47000010" />
+        <register type="NOA" address="0x00009888" value="0x39000883" />
+        <register type="NOA" address="0x00009888" value="0x49000300" />
+        <register type="NOA" address="0x00009888" value="0x3D001064" />
+        <register type="NOA" address="0x00009888" value="0x4B000001" />
+        <register type="NOA" address="0x00009888" value="0x3F000C60" />
+        <register type="NOA" address="0x00009888" value="0x4D000001" />
+        <register type="NOA" address="0x00009888" value="0x41000C04" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000003" />
+        <register type="NOA" address="0x00009888" value="0x3B000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x20000801" />
+        <register type="OA" address="0x00002774" value="0x0111FEEE" />
+        <register type="OA" address="0x00002778" value="0x40001001" />
+        <register type="OA" address="0x0000277C" value="0x0222FDDD" />
+        <register type="OA" address="0x00002780" value="0x80002002" />
+        <register type="OA" address="0x00002784" value="0x0444FBBB" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="2e95713a-c6d8-47a9-9207-eba3e208be51"
+       chipset="CNL"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Rasterizer Input Available"
+             description="The percentage of time in which slice1 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer1_input_available"
+             units="percent"
+             symbol_name="Rasterizer1InputAvailable"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Pixel Values Ready"
+             description="The percentage of time in which slice1 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values1_ready"
+             units="percent"
+             symbol_name="PixelValues1Ready"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice1 PS Output Available"
+             description="The percentage of time in which slice1 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output1_available"
+             units="percent"
+             symbol_name="PSOutput1Available"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice1 Rasterizer Output Ready"
+             description="The percentage of time in which slice1 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer1_output_ready"
+             units="percent"
+             symbol_name="Rasterizer1OutputReady"
+             availability="$SliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice1 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice1 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data1_ready"
+             units="percent"
+             symbol_name="PixelData1Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x0C710004" />
+        <register type="NOA" address="0x00009888" value="0x10747000" />
+        <register type="NOA" address="0x00009888" value="0x12756800" />
+        <register type="NOA" address="0x00009888" value="0x04795000" />
+        <register type="NOA" address="0x00009888" value="0x127C01C0" />
+        <register type="NOA" address="0x00009888" value="0x0CF10004" />
+        <register type="NOA" address="0x00009888" value="0x10F47000" />
+        <register type="NOA" address="0x00009888" value="0x12F56800" />
+        <register type="NOA" address="0x00009888" value="0x04F95000" />
+        <register type="NOA" address="0x00009888" value="0x12FC01C0" />
+        <register type="NOA" address="0x00009888" value="0x1A6C4044" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0004" />
+        <register type="NOA" address="0x00009888" value="0x186C00A0" />
+        <register type="NOA" address="0x00009888" value="0x00710010" />
+        <register type="NOA" address="0x00009888" value="0x02738000" />
+        <register type="NOA" address="0x00009888" value="0x04732000" />
+        <register type="NOA" address="0x00009888" value="0x0673A000" />
+        <register type="NOA" address="0x00009888" value="0x00736000" />
+        <register type="NOA" address="0x00009888" value="0x08740037" />
+        <register type="NOA" address="0x00009888" value="0x0C740000" />
+        <register type="NOA" address="0x00009888" value="0x0A750F36" />
+        <register type="NOA" address="0x00009888" value="0x10750000" />
+        <register type="NOA" address="0x00009888" value="0x04751000" />
+        <register type="NOA" address="0x00009888" value="0x0C752000" />
+        <register type="NOA" address="0x00009888" value="0x0E750000" />
+        <register type="NOA" address="0x00009888" value="0x0C760800" />
+        <register type="NOA" address="0x00009888" value="0x0E768800" />
+        <register type="NOA" address="0x00009888" value="0x10760002" />
+        <register type="NOA" address="0x00009888" value="0x0077C000" />
+        <register type="NOA" address="0x00009888" value="0x0E778000" />
+        <register type="NOA" address="0x00009888" value="0x1477C000" />
+        <register type="NOA" address="0x00009888" value="0x167767E0" />
+        <register type="NOA" address="0x00009888" value="0x18770002" />
+        <register type="NOA" address="0x00009888" value="0x02778000" />
+        <register type="NOA" address="0x00009888" value="0x04778000" />
+        <register type="NOA" address="0x00009888" value="0x0C790017" />
+        <register type="NOA" address="0x00009888" value="0x08790000" />
+        <register type="NOA" address="0x00009888" value="0x0C7B0088" />
+        <register type="NOA" address="0x00009888" value="0x0E7C0032" />
+        <register type="NOA" address="0x00009888" value="0x107C0000" />
+        <register type="NOA" address="0x00009888" value="0x167C0004" />
+        <register type="NOA" address="0x00009888" value="0x04F10200" />
+        <register type="NOA" address="0x00009888" value="0x00F10000" />
+        <register type="NOA" address="0x00009888" value="0x08F40DC0" />
+        <register type="NOA" address="0x00009888" value="0x0CF40000" />
+        <register type="NOA" address="0x00009888" value="0x00F50D80" />
+        <register type="NOA" address="0x00009888" value="0x02F5003C" />
+        <register type="NOA" address="0x00009888" value="0x10F50000" />
+        <register type="NOA" address="0x00009888" value="0x0AF54000" />
+        <register type="NOA" address="0x00009888" value="0x0CF58000" />
+        <register type="NOA" address="0x00009888" value="0x04F50000" />
+        <register type="NOA" address="0x00009888" value="0x06F50000" />
+        <register type="NOA" address="0x00009888" value="0x0EF62200" />
+        <register type="NOA" address="0x00009888" value="0x0CF6A000" />
+        <register type="NOA" address="0x00009888" value="0x0EF7C000" />
+        <register type="NOA" address="0x00009888" value="0x16F71030" />
+        <register type="NOA" address="0x00009888" value="0x18F70001" />
+        <register type="NOA" address="0x00009888" value="0x02F7C000" />
+        <register type="NOA" address="0x00009888" value="0x04F7C000" />
+        <register type="NOA" address="0x00009888" value="0x0CF905C0" />
+        <register type="NOA" address="0x00009888" value="0x08F90000" />
+        <register type="NOA" address="0x00009888" value="0x0CFB0220" />
+        <register type="NOA" address="0x00009888" value="0x0EFC1900" />
+        <register type="NOA" address="0x00009888" value="0x10FC0000" />
+        <register type="NOA" address="0x00009888" value="0x16FC0010" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x2100F000" />
+        <register type="NOA" address="0x00009888" value="0x1D000071" />
+        <register type="NOA" address="0x00009888" value="0x33000000" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2B00C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1300C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x47000001" />
+        <register type="NOA" address="0x00009888" value="0x39000421" />
+        <register type="NOA" address="0x00009888" value="0x49000300" />
+        <register type="NOA" address="0x00009888" value="0x3D000402" />
+        <register type="NOA" address="0x00009888" value="0x4B001101" />
+        <register type="NOA" address="0x00009888" value="0x3F000840" />
+        <register type="NOA" address="0x00009888" value="0x4D000101" />
+        <register type="NOA" address="0x00009888" value="0x41000801" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000180" />
+        <register type="OA" address="0x00002774" value="0x0000FFCF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFFE" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FFFD" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="9bcf4ff2-c15f-4bea-8ec8-8db87791942e"
+       chipset="CNL"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Slice1 Subslice0 Input Available"
+             description="The percentage of time in which slice1 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler10_input_available"
+             units="percent"
+             symbol_name="Sampler10InputAvailable"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice1 Subslice1 Input Available"
+             description="The percentage of time in which slice1 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler11_input_available"
+             units="percent"
+             symbol_name="Sampler11InputAvailable"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice1 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice1 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler10_output_ready"
+             units="percent"
+             symbol_name="Sampler10OutputReady"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Slice1 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice1 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler11_output_ready"
+             units="percent"
+             symbol_name="Sampler11OutputReady"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x14141400" />
+        <register type="NOA" address="0x00009888" value="0x1614000B" />
+        <register type="NOA" address="0x00009888" value="0x14161400" />
+        <register type="NOA" address="0x00009888" value="0x14341400" />
+        <register type="NOA" address="0x00009888" value="0x1634000B" />
+        <register type="NOA" address="0x00009888" value="0x14361400" />
+        <register type="NOA" address="0x00009888" value="0x14941400" />
+        <register type="NOA" address="0x00009888" value="0x1694000B" />
+        <register type="NOA" address="0x00009888" value="0x14961400" />
+        <register type="NOA" address="0x00009888" value="0x14B41400" />
+        <register type="NOA" address="0x00009888" value="0x16B4000B" />
+        <register type="NOA" address="0x00009888" value="0x14B61400" />
+        <register type="NOA" address="0x00009888" value="0x14541400" />
+        <register type="NOA" address="0x00009888" value="0x1654000B" />
+        <register type="NOA" address="0x00009888" value="0x14561400" />
+        <register type="NOA" address="0x00009888" value="0x1A6C5000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0005" />
+        <register type="NOA" address="0x00009888" value="0x186C0280" />
+        <register type="NOA" address="0x00009888" value="0x0673F000" />
+        <register type="NOA" address="0x00009888" value="0x0073C000" />
+        <register type="NOA" address="0x00009888" value="0x04742000" />
+        <register type="NOA" address="0x00009888" value="0x0A74A000" />
+        <register type="NOA" address="0x00009888" value="0x04752000" />
+        <register type="NOA" address="0x00009888" value="0x0A75A000" />
+        <register type="NOA" address="0x00009888" value="0x0C760800" />
+        <register type="NOA" address="0x00009888" value="0x0E760280" />
+        <register type="NOA" address="0x00009888" value="0x0077C000" />
+        <register type="NOA" address="0x00009888" value="0x0E77C000" />
+        <register type="NOA" address="0x00009888" value="0x14774000" />
+        <register type="NOA" address="0x00009888" value="0x1677A950" />
+        <register type="NOA" address="0x00009888" value="0x18770002" />
+        <register type="NOA" address="0x00009888" value="0x04778000" />
+        <register type="NOA" address="0x00009888" value="0x06778000" />
+        <register type="NOA" address="0x00009888" value="0x08774000" />
+        <register type="NOA" address="0x00009888" value="0x0A774000" />
+        <register type="NOA" address="0x00009888" value="0x0C77C000" />
+        <register type="NOA" address="0x00009888" value="0x0A7BA828" />
+        <register type="NOA" address="0x00009888" value="0x0C7B0002" />
+        <register type="NOA" address="0x00009888" value="0x147CE800" />
+        <register type="NOA" address="0x00009888" value="0x167C0003" />
+        <register type="NOA" address="0x00009888" value="0x087CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A7C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C7D8200" />
+        <register type="NOA" address="0x00009888" value="0x1E7D0002" />
+        <register type="NOA" address="0x00009888" value="0x00194000" />
+        <register type="NOA" address="0x00009888" value="0x0E194000" />
+        <register type="NOA" address="0x00009888" value="0x0C194000" />
+        <register type="NOA" address="0x00009888" value="0x00140050" />
+        <register type="NOA" address="0x00009888" value="0x06145800" />
+        <register type="NOA" address="0x00009888" value="0x10140000" />
+        <register type="NOA" address="0x00009888" value="0x18140000" />
+        <register type="NOA" address="0x00009888" value="0x1C140080" />
+        <register type="NOA" address="0x00009888" value="0x0A150001" />
+        <register type="NOA" address="0x00009888" value="0x06160043" />
+        <register type="NOA" address="0x00009888" value="0x10160000" />
+        <register type="NOA" address="0x00009888" value="0x0C160000" />
+        <register type="NOA" address="0x00009888" value="0x1A3900A0" />
+        <register type="NOA" address="0x00009888" value="0x0A394000" />
+        <register type="NOA" address="0x00009888" value="0x08345850" />
+        <register type="NOA" address="0x00009888" value="0x10340000" />
+        <register type="NOA" address="0x00009888" value="0x1C340020" />
+        <register type="NOA" address="0x00009888" value="0x08358000" />
+        <register type="NOA" address="0x00009888" value="0x04362180" />
+        <register type="NOA" address="0x00009888" value="0x10360000" />
+        <register type="NOA" address="0x00009888" value="0x0A360000" />
+        <register type="NOA" address="0x00009888" value="0x12F40140" />
+        <register type="NOA" address="0x00009888" value="0x06F48000" />
+        <register type="NOA" address="0x00009888" value="0x14F5000A" />
+        <register type="NOA" address="0x00009888" value="0x06F58000" />
+        <register type="NOA" address="0x00009888" value="0x10F60028" />
+        <register type="NOA" address="0x00009888" value="0x0EF60002" />
+        <register type="NOA" address="0x00009888" value="0x16F77C00" />
+        <register type="NOA" address="0x00009888" value="0x18F70001" />
+        <register type="NOA" address="0x00009888" value="0x04F74000" />
+        <register type="NOA" address="0x00009888" value="0x06F7C000" />
+        <register type="NOA" address="0x00009888" value="0x0CFB0280" />
+        <register type="NOA" address="0x00009888" value="0x08FB8000" />
+        <register type="NOA" address="0x00009888" value="0x16FC0280" />
+        <register type="NOA" address="0x00009888" value="0x04FC8000" />
+        <register type="NOA" address="0x00009888" value="0x1EFD2800" />
+        <register type="NOA" address="0x00009888" value="0x1CFD0008" />
+        <register type="NOA" address="0x00009888" value="0x1A992000" />
+        <register type="NOA" address="0x00009888" value="0x1C990001" />
+        <register type="NOA" address="0x00009888" value="0x06994000" />
+        <register type="NOA" address="0x00009888" value="0x0C945850" />
+        <register type="NOA" address="0x00009888" value="0x10940000" />
+        <register type="NOA" address="0x00009888" value="0x1E940000" />
+        <register type="NOA" address="0x00009888" value="0x1C940002" />
+        <register type="NOA" address="0x00009888" value="0x08952000" />
+        <register type="NOA" address="0x00009888" value="0x02962180" />
+        <register type="NOA" address="0x00009888" value="0x10960000" />
+        <register type="NOA" address="0x00009888" value="0x06960000" />
+        <register type="NOA" address="0x00009888" value="0x1CB90014" />
+        <register type="NOA" address="0x00009888" value="0x04B94000" />
+        <register type="NOA" address="0x00009888" value="0x0EB45850" />
+        <register type="NOA" address="0x00009888" value="0x10B40000" />
+        <register type="NOA" address="0x00009888" value="0x1EB40000" />
+        <register type="NOA" address="0x00009888" value="0x1AB48000" />
+        <register type="NOA" address="0x00009888" value="0x08B51000" />
+        <register type="NOA" address="0x00009888" value="0x02B60043" />
+        <register type="NOA" address="0x00009888" value="0x10B60000" />
+        <register type="NOA" address="0x00009888" value="0x04B60000" />
+        <register type="NOA" address="0x00009888" value="0x1A590A00" />
+        <register type="NOA" address="0x00009888" value="0x08594000" />
+        <register type="NOA" address="0x00009888" value="0x0A545850" />
+        <register type="NOA" address="0x00009888" value="0x10540000" />
+        <register type="NOA" address="0x00009888" value="0x1C540008" />
+        <register type="NOA" address="0x00009888" value="0x1E540000" />
+        <register type="NOA" address="0x00009888" value="0x08554000" />
+        <register type="NOA" address="0x00009888" value="0x04560043" />
+        <register type="NOA" address="0x00009888" value="0x10560000" />
+        <register type="NOA" address="0x00009888" value="0x08560000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x2100F000" />
+        <register type="NOA" address="0x00009888" value="0x13000071" />
+        <register type="NOA" address="0x00009888" value="0x33000000" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2B00C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x1700C000" />
+        <register type="NOA" address="0x00009888" value="0x1900C000" />
+        <register type="NOA" address="0x00009888" value="0x1B00C000" />
+        <register type="NOA" address="0x00009888" value="0x1D00C000" />
+        <register type="NOA" address="0x00009888" value="0x47000031" />
+        <register type="NOA" address="0x00009888" value="0x39000143" />
+        <register type="NOA" address="0x00009888" value="0x49001110" />
+        <register type="NOA" address="0x00009888" value="0x3D000C61" />
+        <register type="NOA" address="0x00009888" value="0x4B000011" />
+        <register type="NOA" address="0x00009888" value="0x3F0018C3" />
+        <register type="NOA" address="0x00009888" value="0x4D000000" />
+        <register type="NOA" address="0x00009888" value="0x41000842" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000002" />
+        <register type="NOA" address="0x00009888" value="0x3B000480" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x10800000" />
+        <register type="OA" address="0x00002770" value="0x00000018" />
+        <register type="OA" address="0x00002774" value="0x0000FFFC" />
+        <register type="OA" address="0x00002778" value="0x00000060" />
+        <register type="OA" address="0x0000277C" value="0x0000FFF3" />
+        <register type="OA" address="0x00002780" value="0x00000180" />
+        <register type="OA" address="0x00002784" value="0x0000FFCF" />
+        <register type="OA" address="0x00002788" value="0x00000600" />
+        <register type="OA" address="0x0000278C" value="0x0000FF3F" />
+        <register type="OA" address="0x00002790" value="0x00001800" />
+        <register type="OA" address="0x00002794" value="0x0000FCFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="c46c7bb5-f26d-4634-b491-902394af85b1"
+       chipset="CNL"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice1 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice1 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread11_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread11ReadyForDispatch"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="1  C 4 READ $GpuCoreClocks FDIV FSUB"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice1 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice1 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="1  C 5 READ $GpuCoreClocks FDIV FSUB"
+             underscore_name="non_ps_thread10_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread10ReadyForDispatch"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="1  C 2 READ $GpuCoreClocks FDIV FSUB"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice1 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice1 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread10_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread10ReadyForDispatch"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice1 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice1 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="1  C 6 READ $GpuCoreClocks FDIV FSUB"
+             underscore_name="non_ps_thread11_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread11ReadyForDispatch"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="1  C 3 READ $GpuCoreClocks FDIV FSUB"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x12180000" />
+        <register type="NOA" address="0x00009888" value="0x12380000" />
+        <register type="NOA" address="0x00009888" value="0x12980000" />
+        <register type="NOA" address="0x00009888" value="0x12B80000" />
+        <register type="NOA" address="0x00009888" value="0x12580000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C5000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0005" />
+        <register type="NOA" address="0x00009888" value="0x186C2800" />
+        <register type="NOA" address="0x00009888" value="0x0673F000" />
+        <register type="NOA" address="0x00009888" value="0x02733000" />
+        <register type="NOA" address="0x00009888" value="0x0474A000" />
+        <register type="NOA" address="0x00009888" value="0x0A748000" />
+        <register type="NOA" address="0x00009888" value="0x0475A000" />
+        <register type="NOA" address="0x00009888" value="0x0A758000" />
+        <register type="NOA" address="0x00009888" value="0x0C762800" />
+        <register type="NOA" address="0x00009888" value="0x0E760200" />
+        <register type="NOA" address="0x00009888" value="0x0077C000" />
+        <register type="NOA" address="0x00009888" value="0x0E77C000" />
+        <register type="NOA" address="0x00009888" value="0x14774000" />
+        <register type="NOA" address="0x00009888" value="0x1677A950" />
+        <register type="NOA" address="0x00009888" value="0x18770002" />
+        <register type="NOA" address="0x00009888" value="0x0277C000" />
+        <register type="NOA" address="0x00009888" value="0x04774000" />
+        <register type="NOA" address="0x00009888" value="0x06774000" />
+        <register type="NOA" address="0x00009888" value="0x08778000" />
+        <register type="NOA" address="0x00009888" value="0x0A778000" />
+        <register type="NOA" address="0x00009888" value="0x0A7BA802" />
+        <register type="NOA" address="0x00009888" value="0x0C7B0002" />
+        <register type="NOA" address="0x00009888" value="0x087B8000" />
+        <register type="NOA" address="0x00009888" value="0x147CE800" />
+        <register type="NOA" address="0x00009888" value="0x167C0003" />
+        <register type="NOA" address="0x00009888" value="0x047C8000" />
+        <register type="NOA" address="0x00009888" value="0x067CC000" />
+        <register type="NOA" address="0x00009888" value="0x1C7D8008" />
+        <register type="NOA" address="0x00009888" value="0x1E7D0002" />
+        <register type="NOA" address="0x00009888" value="0x00194000" />
+        <register type="NOA" address="0x00009888" value="0x0E194000" />
+        <register type="NOA" address="0x00009888" value="0x02194000" />
+        <register type="NOA" address="0x00009888" value="0x18148000" />
+        <register type="NOA" address="0x00009888" value="0x1C140200" />
+        <register type="NOA" address="0x00009888" value="0x1A142000" />
+        <register type="NOA" address="0x00009888" value="0x0015C000" />
+        <register type="NOA" address="0x00009888" value="0x0A150002" />
+        <register type="NOA" address="0x00009888" value="0x00168000" />
+        <register type="NOA" address="0x00009888" value="0x0E168000" />
+        <register type="NOA" address="0x00009888" value="0x02168000" />
+        <register type="NOA" address="0x00009888" value="0x0018A1A3" />
+        <register type="NOA" address="0x00009888" value="0x0618A500" />
+        <register type="NOA" address="0x00009888" value="0x10180000" />
+        <register type="NOA" address="0x00009888" value="0x1A3900A0" />
+        <register type="NOA" address="0x00009888" value="0x04394000" />
+        <register type="NOA" address="0x00009888" value="0x1C342800" />
+        <register type="NOA" address="0x00009888" value="0x1A348000" />
+        <register type="NOA" address="0x00009888" value="0x0A35000C" />
+        <register type="NOA" address="0x00009888" value="0x08351000" />
+        <register type="NOA" address="0x00009888" value="0x1A360140" />
+        <register type="NOA" address="0x00009888" value="0x04368000" />
+        <register type="NOA" address="0x00009888" value="0x0838A5A3" />
+        <register type="NOA" address="0x00009888" value="0x023800A1" />
+        <register type="NOA" address="0x00009888" value="0x10380000" />
+        <register type="NOA" address="0x00009888" value="0x12F40140" />
+        <register type="NOA" address="0x00009888" value="0x08F42000" />
+        <register type="NOA" address="0x00009888" value="0x14F5000A" />
+        <register type="NOA" address="0x00009888" value="0x08F52000" />
+        <register type="NOA" address="0x00009888" value="0x10F60028" />
+        <register type="NOA" address="0x00009888" value="0x0EF60008" />
+        <register type="NOA" address="0x00009888" value="0x16F77C00" />
+        <register type="NOA" address="0x00009888" value="0x18F70001" />
+        <register type="NOA" address="0x00009888" value="0x08F7C000" />
+        <register type="NOA" address="0x00009888" value="0x0AF74000" />
+        <register type="NOA" address="0x00009888" value="0x0CFB0280" />
+        <register type="NOA" address="0x00009888" value="0x0AFB0020" />
+        <register type="NOA" address="0x00009888" value="0x16FC0280" />
+        <register type="NOA" address="0x00009888" value="0x0AFC8000" />
+        <register type="NOA" address="0x00009888" value="0x1EFD2800" />
+        <register type="NOA" address="0x00009888" value="0x1CFD0200" />
+        <register type="NOA" address="0x00009888" value="0x1A992000" />
+        <register type="NOA" address="0x00009888" value="0x1C990001" />
+        <register type="NOA" address="0x00009888" value="0x08994000" />
+        <register type="NOA" address="0x00009888" value="0x1E940028" />
+        <register type="NOA" address="0x00009888" value="0x1C940008" />
+        <register type="NOA" address="0x00009888" value="0x0A9500C0" />
+        <register type="NOA" address="0x00009888" value="0x08954000" />
+        <register type="NOA" address="0x00009888" value="0x1A964000" />
+        <register type="NOA" address="0x00009888" value="0x1C960002" />
+        <register type="NOA" address="0x00009888" value="0x08968000" />
+        <register type="NOA" address="0x00009888" value="0x0C98A5A3" />
+        <register type="NOA" address="0x00009888" value="0x049800A1" />
+        <register type="NOA" address="0x00009888" value="0x10980000" />
+        <register type="NOA" address="0x00009888" value="0x1CB90014" />
+        <register type="NOA" address="0x00009888" value="0x0AB94000" />
+        <register type="NOA" address="0x00009888" value="0x1EB40280" />
+        <register type="NOA" address="0x00009888" value="0x1CB40020" />
+        <register type="NOA" address="0x00009888" value="0x0AB50300" />
+        <register type="NOA" address="0x00009888" value="0x08B58000" />
+        <register type="NOA" address="0x00009888" value="0x1CB60028" />
+        <register type="NOA" address="0x00009888" value="0x0AB68000" />
+        <register type="NOA" address="0x00009888" value="0x0EB8A5A3" />
+        <register type="NOA" address="0x00009888" value="0x04B8A100" />
+        <register type="NOA" address="0x00009888" value="0x10B80000" />
+        <register type="NOA" address="0x00009888" value="0x1A590A00" />
+        <register type="NOA" address="0x00009888" value="0x06594000" />
+        <register type="NOA" address="0x00009888" value="0x1C548002" />
+        <register type="NOA" address="0x00009888" value="0x1E540002" />
+        <register type="NOA" address="0x00009888" value="0x0A550030" />
+        <register type="NOA" address="0x00009888" value="0x08552000" />
+        <register type="NOA" address="0x00009888" value="0x1A561400" />
+        <register type="NOA" address="0x00009888" value="0x06568000" />
+        <register type="NOA" address="0x00009888" value="0x0A58A5A3" />
+        <register type="NOA" address="0x00009888" value="0x0258A100" />
+        <register type="NOA" address="0x00009888" value="0x10580000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x2100F000" />
+        <register type="NOA" address="0x00009888" value="0x1D000071" />
+        <register type="NOA" address="0x00009888" value="0x33000000" />
+        <register type="NOA" address="0x00009888" value="0x1100C000" />
+        <register type="NOA" address="0x00009888" value="0x1F00C000" />
+        <register type="NOA" address="0x00009888" value="0x2300C000" />
+        <register type="NOA" address="0x00009888" value="0x2500C000" />
+        <register type="NOA" address="0x00009888" value="0x2700C000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2B00C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1300C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x1700C000" />
+        <register type="NOA" address="0x00009888" value="0x1900C000" />
+        <register type="NOA" address="0x00009888" value="0x1B00C000" />
+        <register type="NOA" address="0x00009888" value="0x47000111" />
+        <register type="NOA" address="0x00009888" value="0x39000421" />
+        <register type="NOA" address="0x00009888" value="0x49001300" />
+        <register type="NOA" address="0x00009888" value="0x3D00042B" />
+        <register type="NOA" address="0x00009888" value="0x4B000011" />
+        <register type="NOA" address="0x00009888" value="0x3F001081" />
+        <register type="NOA" address="0x00009888" value="0x4D000000" />
+        <register type="NOA" address="0x00009888" value="0x41000000" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000000" />
+        <register type="NOA" address="0x00009888" value="0x3B000004" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x10800000" />
+        <register type="OA" address="0x00002770" value="0x00000000" />
+        <register type="OA" address="0x00002774" value="0x0000FFFC" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x0000FFF3" />
+        <register type="OA" address="0x00002780" value="0x00000000" />
+        <register type="OA" address="0x00002784" value="0x0000FFCF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000FF3F" />
+        <register type="OA" address="0x00002790" value="0x00000000" />
+        <register type="OA" address="0x00002794" value="0x0000FCFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="aa2d6ab4-99b3-42f8-94d6-4a9aa2baedaf"
+       chipset="CNL"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice1 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header11_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader11ReadyPort1"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice1 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header11_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader11ReadyPort0"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice1 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header10_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader10ReadyPort1"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice1 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice1 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header10_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader10ReadyPort0"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x12184D60" />
+        <register type="NOA" address="0x00009888" value="0x12384D60" />
+        <register type="NOA" address="0x00009888" value="0x12984D60" />
+        <register type="NOA" address="0x00009888" value="0x12B84D60" />
+        <register type="NOA" address="0x00009888" value="0x12584D60" />
+        <register type="NOA" address="0x00009888" value="0x186C2A00" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0001" />
+        <register type="NOA" address="0x00009888" value="0x00738000" />
+        <register type="NOA" address="0x00009888" value="0x02737000" />
+        <register type="NOA" address="0x00009888" value="0x12740140" />
+        <register type="NOA" address="0x00009888" value="0x1475000A" />
+        <register type="NOA" address="0x00009888" value="0x10760028" />
+        <register type="NOA" address="0x00009888" value="0x16777C00" />
+        <register type="NOA" address="0x00009888" value="0x18770001" />
+        <register type="NOA" address="0x00009888" value="0x02774000" />
+        <register type="NOA" address="0x00009888" value="0x04774000" />
+        <register type="NOA" address="0x00009888" value="0x06778000" />
+        <register type="NOA" address="0x00009888" value="0x08778000" />
+        <register type="NOA" address="0x00009888" value="0x0A778000" />
+        <register type="NOA" address="0x00009888" value="0x0C778000" />
+        <register type="NOA" address="0x00009888" value="0x0C7B0280" />
+        <register type="NOA" address="0x00009888" value="0x087BA000" />
+        <register type="NOA" address="0x00009888" value="0x167C0280" />
+        <register type="NOA" address="0x00009888" value="0x027CC000" />
+        <register type="NOA" address="0x00009888" value="0x047CC000" />
+        <register type="NOA" address="0x00009888" value="0x1E7D2800" />
+        <register type="NOA" address="0x00009888" value="0x1A192000" />
+        <register type="NOA" address="0x00009888" value="0x1C190001" />
+        <register type="NOA" address="0x00009888" value="0x1E140028" />
+        <register type="NOA" address="0x00009888" value="0x0A1500C0" />
+        <register type="NOA" address="0x00009888" value="0x1A164000" />
+        <register type="NOA" address="0x00009888" value="0x1C160002" />
+        <register type="NOA" address="0x00009888" value="0x0C18AFA7" />
+        <register type="NOA" address="0x00009888" value="0x10180000" />
+        <register type="NOA" address="0x00009888" value="0x1C390014" />
+        <register type="NOA" address="0x00009888" value="0x1E340280" />
+        <register type="NOA" address="0x00009888" value="0x0A350300" />
+        <register type="NOA" address="0x00009888" value="0x1C360028" />
+        <register type="NOA" address="0x00009888" value="0x0E38AFA7" />
+        <register type="NOA" address="0x00009888" value="0x10380000" />
+        <register type="NOA" address="0x00009888" value="0x06F48000" />
+        <register type="NOA" address="0x00009888" value="0x08F42000" />
+        <register type="NOA" address="0x00009888" value="0x06F58000" />
+        <register type="NOA" address="0x00009888" value="0x08F52000" />
+        <register type="NOA" address="0x00009888" value="0x0EF6000A" />
+        <register type="NOA" address="0x00009888" value="0x06F7C000" />
+        <register type="NOA" address="0x00009888" value="0x08F7C000" />
+        <register type="NOA" address="0x00009888" value="0x0AF74000" />
+        <register type="NOA" address="0x00009888" value="0x0CF74000" />
+        <register type="NOA" address="0x00009888" value="0x0AFB00A0" />
+        <register type="NOA" address="0x00009888" value="0x0AFC8000" />
+        <register type="NOA" address="0x00009888" value="0x0CFC8000" />
+        <register type="NOA" address="0x00009888" value="0x1CFD0A00" />
+        <register type="NOA" address="0x00009888" value="0x06994000" />
+        <register type="NOA" address="0x00009888" value="0x08994000" />
+        <register type="NOA" address="0x00009888" value="0x1C94000A" />
+        <register type="NOA" address="0x00009888" value="0x08956000" />
+        <register type="NOA" address="0x00009888" value="0x06968000" />
+        <register type="NOA" address="0x00009888" value="0x08968000" />
+        <register type="NOA" address="0x00009888" value="0x0298A700" />
+        <register type="NOA" address="0x00009888" value="0x049800AF" />
+        <register type="NOA" address="0x00009888" value="0x10980000" />
+        <register type="NOA" address="0x00009888" value="0x0AB94000" />
+        <register type="NOA" address="0x00009888" value="0x0CB94000" />
+        <register type="NOA" address="0x00009888" value="0x1CB400A0" />
+        <register type="NOA" address="0x00009888" value="0x08B58000" />
+        <register type="NOA" address="0x00009888" value="0x0AB50001" />
+        <register type="NOA" address="0x00009888" value="0x0AB68000" />
+        <register type="NOA" address="0x00009888" value="0x0CB68000" />
+        <register type="NOA" address="0x00009888" value="0x04B8A700" />
+        <register type="NOA" address="0x00009888" value="0x06B800AF" />
+        <register type="NOA" address="0x00009888" value="0x10B80000" />
+        <register type="NOA" address="0x00009888" value="0x02594000" />
+        <register type="NOA" address="0x00009888" value="0x04594000" />
+        <register type="NOA" address="0x00009888" value="0x1A54A000" />
+        <register type="NOA" address="0x00009888" value="0x00558000" />
+        <register type="NOA" address="0x00009888" value="0x08551000" />
+        <register type="NOA" address="0x00009888" value="0x02568000" />
+        <register type="NOA" address="0x00009888" value="0x04568000" />
+        <register type="NOA" address="0x00009888" value="0x0058A700" />
+        <register type="NOA" address="0x00009888" value="0x025800AF" />
+        <register type="NOA" address="0x00009888" value="0x10580000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x21003000" />
+        <register type="NOA" address="0x00009888" value="0x27000071" />
+        <register type="NOA" address="0x00009888" value="0x33000000" />
+        <register type="NOA" address="0x00009888" value="0x2900C000" />
+        <register type="NOA" address="0x00009888" value="0x2B00C000" />
+        <register type="NOA" address="0x00009888" value="0x2D00C000" />
+        <register type="NOA" address="0x00009888" value="0x2F00C000" />
+        <register type="NOA" address="0x00009888" value="0x1300C000" />
+        <register type="NOA" address="0x00009888" value="0x1500C000" />
+        <register type="NOA" address="0x00009888" value="0x1700C000" />
+        <register type="NOA" address="0x00009888" value="0x1900C000" />
+        <register type="NOA" address="0x00009888" value="0x1B00C000" />
+        <register type="NOA" address="0x00009888" value="0x1D00C000" />
+        <register type="NOA" address="0x00009888" value="0x4B003000" />
+        <register type="NOA" address="0x00009888" value="0x3F002C00" />
+        <register type="NOA" address="0x00009888" value="0x4D001111" />
+        <register type="NOA" address="0x00009888" value="0x41000421" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+        <register type="NOA" address="0x00009888" value="0x43000001" />
+        <register type="NOA" address="0x00009888" value="0x47000000" />
+        <register type="NOA" address="0x00009888" value="0x39001080" />
+        <register type="NOA" address="0x00009888" value="0x3B000000" />
+        <register type="NOA" address="0x00009888" value="0x49000000" />
+        <register type="NOA" address="0x00009888" value="0x3D000000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TestOa"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="db41edd4-d8e7-4730-ad11-b9a2d6833503"
+       chipset="CNL"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.6666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.3333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.3333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.16666"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x17060000" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x13034000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x07060066" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x05060000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x0F080040" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x07091000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x0F041000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x1D004000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x35000000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x49000000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x3D000000" />
+        <register type="NOA" address="0x00009884" value="0x00000007" />
+        <register type="NOA" address="0x00009888" value="0x31000000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x0000FFFF" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFF" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x0000FFFF" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-glk.xml b/lib/i915/perf-configs/oa-glk.xml
new file mode 100644
index 00000000..94dff61a
--- /dev/null
+++ b/lib/i915/perf-configs/oa-glk.xml
@@ -0,0 +1,9346 @@
+<?xml version="1.0"?>
+<metrics version="1562317148" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="d72df5c7-5b4a-4274-a43f-00b0fd51fc68"
+       chipset="GLK"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C00F0" />
+        <register type="NOA" address="0x00009888" value="0x12120280" />
+        <register type="NOA" address="0x00009888" value="0x12320280" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900C00" />
+        <register type="NOA" address="0x00009888" value="0x419000A0" />
+        <register type="NOA" address="0x00009888" value="0x002D1000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D5000" />
+        <register type="NOA" address="0x00009888" value="0x0A2D1000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E0800" />
+        <register type="NOA" address="0x00009888" value="0x0E2E5900" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4C4000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C4F0010" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A0FCC00" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0002" />
+        <register type="NOA" address="0x00009888" value="0x1C2C0040" />
+        <register type="NOA" address="0x00009888" value="0x00101000" />
+        <register type="NOA" address="0x00009888" value="0x04101000" />
+        <register type="NOA" address="0x00009888" value="0x00114000" />
+        <register type="NOA" address="0x00009888" value="0x08114000" />
+        <register type="NOA" address="0x00009888" value="0x00120020" />
+        <register type="NOA" address="0x00009888" value="0x08120021" />
+        <register type="NOA" address="0x00009888" value="0x00141000" />
+        <register type="NOA" address="0x00009888" value="0x08141000" />
+        <register type="NOA" address="0x00009888" value="0x02308000" />
+        <register type="NOA" address="0x00009888" value="0x04302000" />
+        <register type="NOA" address="0x00009888" value="0x06318000" />
+        <register type="NOA" address="0x00009888" value="0x08318000" />
+        <register type="NOA" address="0x00009888" value="0x06320800" />
+        <register type="NOA" address="0x00009888" value="0x08320840" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x06344000" />
+        <register type="NOA" address="0x00009888" value="0x08344000" />
+        <register type="NOA" address="0x00009888" value="0x0D931831" />
+        <register type="NOA" address="0x00009888" value="0x0F939F3F" />
+        <register type="NOA" address="0x00009888" value="0x01939E80" />
+        <register type="NOA" address="0x00009888" value="0x039303BC" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1993002A" />
+        <register type="NOA" address="0x00009888" value="0x07930000" />
+        <register type="NOA" address="0x00009888" value="0x09930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900177" />
+        <register type="NOA" address="0x00009888" value="0x1F900187" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x53901110" />
+        <register type="NOA" address="0x00009888" value="0x43900423" />
+        <register type="NOA" address="0x00009888" value="0x55900111" />
+        <register type="NOA" address="0x00009888" value="0x47900C02" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900020" />
+        <register type="NOA" address="0x00009888" value="0x59901111" />
+        <register type="NOA" address="0x00009888" value="0x4B900421" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x45900821" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="814285f6-354d-41d2-ba49-e24e622714a0"
+       chipset="GLK"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL  $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x39900340" />
+        <register type="NOA" address="0x00009888" value="0x3F900C00" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x002D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D4000" />
+        <register type="NOA" address="0x00009888" value="0x0A2D1000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E1400" />
+        <register type="NOA" address="0x00009888" value="0x0E2E5100" />
+        <register type="NOA" address="0x00009888" value="0x102E0114" />
+        <register type="NOA" address="0x00009888" value="0x044CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4C4000" />
+        <register type="NOA" address="0x00009888" value="0x104C8000" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x004EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F6B42" />
+        <register type="NOA" address="0x00009888" value="0x064F6200" />
+        <register type="NOA" address="0x00009888" value="0x084F4100" />
+        <register type="NOA" address="0x00009888" value="0x0A4F0061" />
+        <register type="NOA" address="0x00009888" value="0x0C4F6C4C" />
+        <register type="NOA" address="0x00009888" value="0x0E4F4B00" />
+        <register type="NOA" address="0x00009888" value="0x1A4F0000" />
+        <register type="NOA" address="0x00009888" value="0x1C4F0000" />
+        <register type="NOA" address="0x00009888" value="0x180F5000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F8800" />
+        <register type="NOA" address="0x00009888" value="0x1C0F08A2" />
+        <register type="NOA" address="0x00009888" value="0x182C4000" />
+        <register type="NOA" address="0x00009888" value="0x1C2C1451" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x1A2C0010" />
+        <register type="NOA" address="0x00009888" value="0x01938000" />
+        <register type="NOA" address="0x00009888" value="0x0F938000" />
+        <register type="NOA" address="0x00009888" value="0x19938A28" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x19900177" />
+        <register type="NOA" address="0x00009888" value="0x1B900178" />
+        <register type="NOA" address="0x00009888" value="0x1D900125" />
+        <register type="NOA" address="0x00009888" value="0x1F900123" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x53901000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x55900111" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="07d397a6-b3e6-49f6-9433-a4f293d55978"
+       chipset="GLK"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull stall pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x0C2E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A2F0000" />
+        <register type="NOA" address="0x00009888" value="0x10186800" />
+        <register type="NOA" address="0x00009888" value="0x11810019" />
+        <register type="NOA" address="0x00009888" value="0x15810013" />
+        <register type="NOA" address="0x00009888" value="0x13820020" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x17840000" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x21860000" />
+        <register type="NOA" address="0x00009888" value="0x178703E0" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x022E5400" />
+        <register type="NOA" address="0x00009888" value="0x002E0000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0080" />
+        <register type="NOA" address="0x00009888" value="0x082F0040" />
+        <register type="NOA" address="0x00009888" value="0x002F0000" />
+        <register type="NOA" address="0x00009888" value="0x06143000" />
+        <register type="NOA" address="0x00009888" value="0x06174000" />
+        <register type="NOA" address="0x00009888" value="0x06180012" />
+        <register type="NOA" address="0x00009888" value="0x00180000" />
+        <register type="NOA" address="0x00009888" value="0x0D804000" />
+        <register type="NOA" address="0x00009888" value="0x0F804000" />
+        <register type="NOA" address="0x00009888" value="0x05804000" />
+        <register type="NOA" address="0x00009888" value="0x09810200" />
+        <register type="NOA" address="0x00009888" value="0x0B810030" />
+        <register type="NOA" address="0x00009888" value="0x03810003" />
+        <register type="NOA" address="0x00009888" value="0x21819140" />
+        <register type="NOA" address="0x00009888" value="0x23819050" />
+        <register type="NOA" address="0x00009888" value="0x25810018" />
+        <register type="NOA" address="0x00009888" value="0x0B820980" />
+        <register type="NOA" address="0x00009888" value="0x03820D80" />
+        <register type="NOA" address="0x00009888" value="0x11820000" />
+        <register type="NOA" address="0x00009888" value="0x0182C000" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x09824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0D830004" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x0F831000" />
+        <register type="NOA" address="0x00009888" value="0x01848072" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x07848000" />
+        <register type="NOA" address="0x00009888" value="0x09844000" />
+        <register type="NOA" address="0x00009888" value="0x0F848000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x09860092" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x01869100" />
+        <register type="NOA" address="0x00009888" value="0x0F870065" />
+        <register type="NOA" address="0x00009888" value="0x01870000" />
+        <register type="NOA" address="0x00009888" value="0x19930800" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x1B952000" />
+        <register type="NOA" address="0x00009888" value="0x1D955055" />
+        <register type="NOA" address="0x00009888" value="0x1F951455" />
+        <register type="NOA" address="0x00009888" value="0x0992A000" />
+        <register type="NOA" address="0x00009888" value="0x0F928000" />
+        <register type="NOA" address="0x00009888" value="0x1192A800" />
+        <register type="NOA" address="0x00009888" value="0x1392028A" />
+        <register type="NOA" address="0x00009888" value="0x0B92A000" />
+        <register type="NOA" address="0x00009888" value="0x0D922000" />
+        <register type="NOA" address="0x00009888" value="0x13908000" />
+        <register type="NOA" address="0x00009888" value="0x21908000" />
+        <register type="NOA" address="0x00009888" value="0x23908000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27908000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C01" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900863" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900061" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C22" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="1a356946-5428-450b-a2f0-89f8783a302d"
+       chipset="GLK"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x19800343" />
+        <register type="NOA" address="0x00009888" value="0x39900340" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x41900003" />
+        <register type="NOA" address="0x00009888" value="0x03803180" />
+        <register type="NOA" address="0x00009888" value="0x058035E2" />
+        <register type="NOA" address="0x00009888" value="0x0780006A" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x2181A000" />
+        <register type="NOA" address="0x00009888" value="0x2381000A" />
+        <register type="NOA" address="0x00009888" value="0x1D950550" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D92A000" />
+        <register type="NOA" address="0x00009888" value="0x0F922000" />
+        <register type="NOA" address="0x00009888" value="0x13900170" />
+        <register type="NOA" address="0x00009888" value="0x21900171" />
+        <register type="NOA" address="0x00009888" value="0x23900172" />
+        <register type="NOA" address="0x00009888" value="0x25900173" />
+        <register type="NOA" address="0x00009888" value="0x27900174" />
+        <register type="NOA" address="0x00009888" value="0x29900175" />
+        <register type="NOA" address="0x00009888" value="0x2B900176" />
+        <register type="NOA" address="0x00009888" value="0x2D900177" />
+        <register type="NOA" address="0x00009888" value="0x2F90017F" />
+        <register type="NOA" address="0x00009888" value="0x31900125" />
+        <register type="NOA" address="0x00009888" value="0x15900123" />
+        <register type="NOA" address="0x00009888" value="0x17900121" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43901084" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47901080" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49901084" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B901084" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900004" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="5299be9d-7a61-4c99-9f81-f87e6c5aaca9"
+       chipset="GLK"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x19800343" />
+        <register type="NOA" address="0x00009888" value="0x39900340" />
+        <register type="NOA" address="0x00009888" value="0x3F900000" />
+        <register type="NOA" address="0x00009888" value="0x41900080" />
+        <register type="NOA" address="0x00009888" value="0x03803180" />
+        <register type="NOA" address="0x00009888" value="0x058035E2" />
+        <register type="NOA" address="0x00009888" value="0x0780006A" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x2181A000" />
+        <register type="NOA" address="0x00009888" value="0x2381000A" />
+        <register type="NOA" address="0x00009888" value="0x1D950550" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D92A000" />
+        <register type="NOA" address="0x00009888" value="0x0F922000" />
+        <register type="NOA" address="0x00009888" value="0x13900180" />
+        <register type="NOA" address="0x00009888" value="0x21900181" />
+        <register type="NOA" address="0x00009888" value="0x23900182" />
+        <register type="NOA" address="0x00009888" value="0x25900183" />
+        <register type="NOA" address="0x00009888" value="0x27900184" />
+        <register type="NOA" address="0x00009888" value="0x29900185" />
+        <register type="NOA" address="0x00009888" value="0x2B900186" />
+        <register type="NOA" address="0x00009888" value="0x2D900187" />
+        <register type="NOA" address="0x00009888" value="0x2F900170" />
+        <register type="NOA" address="0x00009888" value="0x31900125" />
+        <register type="NOA" address="0x00009888" value="0x15900123" />
+        <register type="NOA" address="0x00009888" value="0x17900121" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43901084" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47901080" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49901084" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B901084" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900004" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="bc9bcff2-459a-4cbc-986d-a84b077153f3"
+       chipset="GLK"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C0160" />
+        <register type="NOA" address="0x00009888" value="0x161C0015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x002D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D5000" />
+        <register type="NOA" address="0x00009888" value="0x0A2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5400" />
+        <register type="NOA" address="0x00009888" value="0x0E2E5515" />
+        <register type="NOA" address="0x00009888" value="0x102E0155" />
+        <register type="NOA" address="0x00009888" value="0x044CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4CC000" />
+        <register type="NOA" address="0x00009888" value="0x0E4CC000" />
+        <register type="NOA" address="0x00009888" value="0x104C8000" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x004EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084EA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0C4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4F4B41" />
+        <register type="NOA" address="0x00009888" value="0x004F4200" />
+        <register type="NOA" address="0x00009888" value="0x024F404C" />
+        <register type="NOA" address="0x00009888" value="0x1C4F0000" />
+        <register type="NOA" address="0x00009888" value="0x1A4F0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0A1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0031" />
+        <register type="NOA" address="0x00009888" value="0x061C1900" />
+        <register type="NOA" address="0x00009888" value="0x081C1A33" />
+        <register type="NOA" address="0x00009888" value="0x0A1C1B35" />
+        <register type="NOA" address="0x00009888" value="0x0C1C3337" />
+        <register type="NOA" address="0x00009888" value="0x041C31C7" />
+        <register type="NOA" address="0x00009888" value="0x180F5000" />
+        <register type="NOA" address="0x00009888" value="0x1A0FA8AA" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0AAA" />
+        <register type="NOA" address="0x00009888" value="0x182C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C2C6AAA" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x1A2C2950" />
+        <register type="NOA" address="0x00009888" value="0x01938000" />
+        <register type="NOA" address="0x00009888" value="0x0F938000" />
+        <register type="NOA" address="0x00009888" value="0x1993AAAA" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29904000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900420" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900400" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="88ec931f-5b4a-453a-9db6-a61232b6143d"
+       chipset="GLK"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages send to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C03B0" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F900C00" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x002D1000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E0400" />
+        <register type="NOA" address="0x00009888" value="0x0E2E1500" />
+        <register type="NOA" address="0x00009888" value="0x102E0140" />
+        <register type="NOA" address="0x00009888" value="0x044C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4CC000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x004E2000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x1A4F4001" />
+        <register type="NOA" address="0x00009888" value="0x1C4F5005" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x180F1000" />
+        <register type="NOA" address="0x00009888" value="0x1A0FA800" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C4000" />
+        <register type="NOA" address="0x00009888" value="0x1C2C4015" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x03931980" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x01938000" />
+        <register type="NOA" address="0x00009888" value="0x0F938000" />
+        <register type="NOA" address="0x00009888" value="0x1993A00A" />
+        <register type="NOA" address="0x00009888" value="0x07930000" />
+        <register type="NOA" address="0x00009888" value="0x09930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900177" />
+        <register type="NOA" address="0x00009888" value="0x1F900178" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x53901000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x55900111" />
+        <register type="NOA" address="0x00009888" value="0x47900001" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="0329ea02-ebb8-43f1-bf89-c5bdcccd3eb4"
+       chipset="GLK"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x022D4000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0055" />
+        <register type="NOA" address="0x00009888" value="0x064C8000" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x024F6100" />
+        <register type="NOA" address="0x00009888" value="0x044F416B" />
+        <register type="NOA" address="0x00009888" value="0x064F004B" />
+        <register type="NOA" address="0x00009888" value="0x1A4F0000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F02A8" />
+        <register type="NOA" address="0x00009888" value="0x1A2C5500" />
+        <register type="NOA" address="0x00009888" value="0x0F808000" />
+        <register type="NOA" address="0x00009888" value="0x25810020" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x1F951000" />
+        <register type="NOA" address="0x00009888" value="0x13920200" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="5e57a25a-1d18-4e94-b84b-08ea66751b8c"
+       chipset="GLK"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12643400" />
+        <register type="NOA" address="0x00009888" value="0x12653400" />
+        <register type="NOA" address="0x00009888" value="0x106C6800" />
+        <register type="NOA" address="0x00009888" value="0x126C001E" />
+        <register type="NOA" address="0x00009888" value="0x166C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x102E0154" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0055" />
+        <register type="NOA" address="0x00009888" value="0x104C8000" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x0C4EA000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C4F5500" />
+        <register type="NOA" address="0x00009888" value="0x1A4F1554" />
+        <register type="NOA" address="0x00009888" value="0x0A640024" />
+        <register type="NOA" address="0x00009888" value="0x10640000" />
+        <register type="NOA" address="0x00009888" value="0x04640000" />
+        <register type="NOA" address="0x00009888" value="0x0C650024" />
+        <register type="NOA" address="0x00009888" value="0x10650000" />
+        <register type="NOA" address="0x00009888" value="0x06650000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0900" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0AA0" />
+        <register type="NOA" address="0x00009888" value="0x180F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F02AA" />
+        <register type="NOA" address="0x00009888" value="0x1C2C5400" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0001" />
+        <register type="NOA" address="0x00009888" value="0x1A2C5550" />
+        <register type="NOA" address="0x00009888" value="0x1993AA00" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900421" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900420" />
+        <register type="NOA" address="0x00009888" value="0x45900021" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="f0652373-d361-426f-b36d-9ffec288bdc6"
+       chipset="GLK"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x102D7800" />
+        <register type="NOA" address="0x00009888" value="0x122D79E0" />
+        <register type="NOA" address="0x00009888" value="0x0C2F0004" />
+        <register type="NOA" address="0x00009888" value="0x100E3800" />
+        <register type="NOA" address="0x00009888" value="0x180F0005" />
+        <register type="NOA" address="0x00009888" value="0x002D0940" />
+        <register type="NOA" address="0x00009888" value="0x022D802F" />
+        <register type="NOA" address="0x00009888" value="0x042D4013" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0050" />
+        <register type="NOA" address="0x00009888" value="0x022F0010" />
+        <register type="NOA" address="0x00009888" value="0x002F0000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x040E0480" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x060F0027" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F0040" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x439014A0" />
+        <register type="NOA" address="0x00009888" value="0x459000A4" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="6ac97d12-ce13-428a-b20c-6902bde2608b"
+       chipset="GLK"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121300A0" />
+        <register type="NOA" address="0x00009888" value="0x141600AB" />
+        <register type="NOA" address="0x00009888" value="0x123300A0" />
+        <register type="NOA" address="0x00009888" value="0x143600AB" />
+        <register type="NOA" address="0x00009888" value="0x125300A0" />
+        <register type="NOA" address="0x00009888" value="0x145600AB" />
+        <register type="NOA" address="0x00009888" value="0x0C2D4000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x102E01A0" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0065" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x084C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x044E2000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x180F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F023F" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0003" />
+        <register type="NOA" address="0x00009888" value="0x1A2CC030" />
+        <register type="NOA" address="0x00009888" value="0x04132180" />
+        <register type="NOA" address="0x00009888" value="0x02130000" />
+        <register type="NOA" address="0x00009888" value="0x0C148000" />
+        <register type="NOA" address="0x00009888" value="0x0E142000" />
+        <register type="NOA" address="0x00009888" value="0x04148000" />
+        <register type="NOA" address="0x00009888" value="0x1E150140" />
+        <register type="NOA" address="0x00009888" value="0x1C150040" />
+        <register type="NOA" address="0x00009888" value="0x0C163000" />
+        <register type="NOA" address="0x00009888" value="0x0E160068" />
+        <register type="NOA" address="0x00009888" value="0x10160000" />
+        <register type="NOA" address="0x00009888" value="0x18160000" />
+        <register type="NOA" address="0x00009888" value="0x0A164000" />
+        <register type="NOA" address="0x00009888" value="0x04330043" />
+        <register type="NOA" address="0x00009888" value="0x02330000" />
+        <register type="NOA" address="0x00009888" value="0x0234A000" />
+        <register type="NOA" address="0x00009888" value="0x04342000" />
+        <register type="NOA" address="0x00009888" value="0x1C350015" />
+        <register type="NOA" address="0x00009888" value="0x02363460" />
+        <register type="NOA" address="0x00009888" value="0x10360000" />
+        <register type="NOA" address="0x00009888" value="0x04360000" />
+        <register type="NOA" address="0x00009888" value="0x06360000" />
+        <register type="NOA" address="0x00009888" value="0x08364000" />
+        <register type="NOA" address="0x00009888" value="0x06530043" />
+        <register type="NOA" address="0x00009888" value="0x02530000" />
+        <register type="NOA" address="0x00009888" value="0x0E548000" />
+        <register type="NOA" address="0x00009888" value="0x00548000" />
+        <register type="NOA" address="0x00009888" value="0x06542000" />
+        <register type="NOA" address="0x00009888" value="0x1E550400" />
+        <register type="NOA" address="0x00009888" value="0x1A552000" />
+        <register type="NOA" address="0x00009888" value="0x1C550100" />
+        <register type="NOA" address="0x00009888" value="0x0E563000" />
+        <register type="NOA" address="0x00009888" value="0x00563400" />
+        <register type="NOA" address="0x00009888" value="0x10560000" />
+        <register type="NOA" address="0x00009888" value="0x18560000" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x0C564000" />
+        <register type="NOA" address="0x00009888" value="0x1993A800" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B9014A0" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900001" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900820" />
+        <register type="NOA" address="0x00009888" value="0x45901022" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="59ea703a-9a35-4aed-a985-0d9ab7aceaba"
+       chipset="GLK"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A0000" />
+        <register type="NOA" address="0x00009888" value="0x143A0000" />
+        <register type="NOA" address="0x00009888" value="0x145A0000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D4000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D5000" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x102E0150" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E006A" />
+        <register type="NOA" address="0x00009888" value="0x124C8000" />
+        <register type="NOA" address="0x00009888" value="0x144C8000" />
+        <register type="NOA" address="0x00009888" value="0x164C2000" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4EA000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024E2000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x1C0F0BC0" />
+        <register type="NOA" address="0x00009888" value="0x180F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F0302" />
+        <register type="NOA" address="0x00009888" value="0x1E2C0003" />
+        <register type="NOA" address="0x00009888" value="0x1A2C00F0" />
+        <register type="NOA" address="0x00009888" value="0x021A3080" />
+        <register type="NOA" address="0x00009888" value="0x041A31E5" />
+        <register type="NOA" address="0x00009888" value="0x02148000" />
+        <register type="NOA" address="0x00009888" value="0x0414A000" />
+        <register type="NOA" address="0x00009888" value="0x1C150054" />
+        <register type="NOA" address="0x00009888" value="0x06168000" />
+        <register type="NOA" address="0x00009888" value="0x08168000" />
+        <register type="NOA" address="0x00009888" value="0x0A168000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A3280" />
+        <register type="NOA" address="0x00009888" value="0x0E3A0063" />
+        <register type="NOA" address="0x00009888" value="0x063A0061" />
+        <register type="NOA" address="0x00009888" value="0x023A0000" />
+        <register type="NOA" address="0x00009888" value="0x0C348000" />
+        <register type="NOA" address="0x00009888" value="0x0E342000" />
+        <register type="NOA" address="0x00009888" value="0x06342000" />
+        <register type="NOA" address="0x00009888" value="0x1E350140" />
+        <register type="NOA" address="0x00009888" value="0x1C350100" />
+        <register type="NOA" address="0x00009888" value="0x18360028" />
+        <register type="NOA" address="0x00009888" value="0x0C368000" />
+        <register type="NOA" address="0x00009888" value="0x0E5A3080" />
+        <register type="NOA" address="0x00009888" value="0x005A3280" />
+        <register type="NOA" address="0x00009888" value="0x025A0063" />
+        <register type="NOA" address="0x00009888" value="0x0E548000" />
+        <register type="NOA" address="0x00009888" value="0x00548000" />
+        <register type="NOA" address="0x00009888" value="0x02542000" />
+        <register type="NOA" address="0x00009888" value="0x1E550400" />
+        <register type="NOA" address="0x00009888" value="0x1A552000" />
+        <register type="NOA" address="0x00009888" value="0x1C550001" />
+        <register type="NOA" address="0x00009888" value="0x18560080" />
+        <register type="NOA" address="0x00009888" value="0x02568000" />
+        <register type="NOA" address="0x00009888" value="0x04568000" />
+        <register type="NOA" address="0x00009888" value="0x1993A800" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x2D904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4D900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x45901084" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="f2d6d718-e7b1-48f4-9624-45230d2fe2a0"
+       chipset="GLK"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A026B" />
+        <register type="NOA" address="0x00009888" value="0x143A0173" />
+        <register type="NOA" address="0x00009888" value="0x145A026B" />
+        <register type="NOA" address="0x00009888" value="0x002D4000" />
+        <register type="NOA" address="0x00009888" value="0x022D5000" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E5000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0069" />
+        <register type="NOA" address="0x00009888" value="0x044C8000" />
+        <register type="NOA" address="0x00009888" value="0x064CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C4000" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x024EA000" />
+        <register type="NOA" address="0x00009888" value="0x064E2000" />
+        <register type="NOA" address="0x00009888" value="0x180F6000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F030A" />
+        <register type="NOA" address="0x00009888" value="0x1A2C03C0" />
+        <register type="NOA" address="0x00009888" value="0x041A37E7" />
+        <register type="NOA" address="0x00009888" value="0x021A0000" />
+        <register type="NOA" address="0x00009888" value="0x0414A000" />
+        <register type="NOA" address="0x00009888" value="0x1C150050" />
+        <register type="NOA" address="0x00009888" value="0x08168000" />
+        <register type="NOA" address="0x00009888" value="0x0A168000" />
+        <register type="NOA" address="0x00009888" value="0x003A3380" />
+        <register type="NOA" address="0x00009888" value="0x063A006F" />
+        <register type="NOA" address="0x00009888" value="0x023A0000" />
+        <register type="NOA" address="0x00009888" value="0x00348000" />
+        <register type="NOA" address="0x00009888" value="0x06342000" />
+        <register type="NOA" address="0x00009888" value="0x1A352000" />
+        <register type="NOA" address="0x00009888" value="0x1C350100" />
+        <register type="NOA" address="0x00009888" value="0x02368000" />
+        <register type="NOA" address="0x00009888" value="0x0C368000" />
+        <register type="NOA" address="0x00009888" value="0x025A37E7" />
+        <register type="NOA" address="0x00009888" value="0x0254A000" />
+        <register type="NOA" address="0x00009888" value="0x1C550005" />
+        <register type="NOA" address="0x00009888" value="0x04568000" />
+        <register type="NOA" address="0x00009888" value="0x06568000" />
+        <register type="NOA" address="0x00009888" value="0x03938000" />
+        <register type="NOA" address="0x00009888" value="0x05938000" />
+        <register type="NOA" address="0x00009888" value="0x07938000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17904000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900020" />
+        <register type="NOA" address="0x00009888" value="0x45901080" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="15274c82-27d2-4819-876a-7cb1a2c59ba4"
+       chipset="GLK"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 7 READ C 6 READ FADD C 5 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A001F" />
+        <register type="NOA" address="0x00009888" value="0x143A001F" />
+        <register type="NOA" address="0x00009888" value="0x145A001F" />
+        <register type="NOA" address="0x00009888" value="0x042D5000" />
+        <register type="NOA" address="0x00009888" value="0x062D1000" />
+        <register type="NOA" address="0x00009888" value="0x0E2E0094" />
+        <register type="NOA" address="0x00009888" value="0x084CC000" />
+        <register type="NOA" address="0x00009888" value="0x044EA000" />
+        <register type="NOA" address="0x00009888" value="0x1A0F00E0" />
+        <register type="NOA" address="0x00009888" value="0x1A2C0C00" />
+        <register type="NOA" address="0x00009888" value="0x061A0063" />
+        <register type="NOA" address="0x00009888" value="0x021A0000" />
+        <register type="NOA" address="0x00009888" value="0x06142000" />
+        <register type="NOA" address="0x00009888" value="0x1C150100" />
+        <register type="NOA" address="0x00009888" value="0x0C168000" />
+        <register type="NOA" address="0x00009888" value="0x043A3180" />
+        <register type="NOA" address="0x00009888" value="0x023A0000" />
+        <register type="NOA" address="0x00009888" value="0x04348000" />
+        <register type="NOA" address="0x00009888" value="0x1C350040" />
+        <register type="NOA" address="0x00009888" value="0x0A368000" />
+        <register type="NOA" address="0x00009888" value="0x045A0063" />
+        <register type="NOA" address="0x00009888" value="0x025A0000" />
+        <register type="NOA" address="0x00009888" value="0x04542000" />
+        <register type="NOA" address="0x00009888" value="0x1C550010" />
+        <register type="NOA" address="0x00009888" value="0x08568000" />
+        <register type="NOA" address="0x00009888" value="0x09938000" />
+        <register type="NOA" address="0x00009888" value="0x0B938000" />
+        <register type="NOA" address="0x00009888" value="0x0D938000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D904000" />
+        <register type="NOA" address="0x00009888" value="0x1F904000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900004" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00001000" />
+        <register type="FLEX" address="0x0000E558" value="0x00003002" />
+        <register type="FLEX" address="0x0000E658" value="0x00005004" />
+        <register type="FLEX" address="0x0000E758" value="0x00011010" />
+        <register type="FLEX" address="0x0000E45C" value="0x00050012" />
+        <register type="FLEX" address="0x0000E55C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E65C" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="dd3fd789-e783-4204-8cd0-b671bbccb0cf"
+       chipset="GLK"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x19800000" />
+        <register type="NOA" address="0x00009888" value="0x07800063" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x23810008" />
+        <register type="NOA" address="0x00009888" value="0x1D950400" />
+        <register type="NOA" address="0x00009888" value="0x0F922000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="e6868953-fb47-431d-a060-f785916558fc"
+       chipset="GLK"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x124C3080" />
+        <register type="NOA" address="0x00009888" value="0x002D1000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x082D5000" />
+        <register type="NOA" address="0x00009888" value="0x0A2D5000" />
+        <register type="NOA" address="0x00009888" value="0x0C2E0400" />
+        <register type="NOA" address="0x00009888" value="0x0E2E5500" />
+        <register type="NOA" address="0x00009888" value="0x102E0001" />
+        <register type="NOA" address="0x00009888" value="0x004C0045" />
+        <register type="NOA" address="0x00009888" value="0x064C2300" />
+        <register type="NOA" address="0x00009888" value="0x084C26C4" />
+        <register type="NOA" address="0x00009888" value="0x0A4C264E" />
+        <register type="NOA" address="0x00009888" value="0x164C0000" />
+        <register type="NOA" address="0x00009888" value="0x044C0000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E4C0000" />
+        <register type="NOA" address="0x00009888" value="0x01938000" />
+        <register type="NOA" address="0x00009888" value="0x0F938000" />
+        <register type="NOA" address="0x00009888" value="0x199300AA" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29904000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-hsw.xml b/lib/i915/perf-configs/oa-hsw.xml
new file mode 100644
index 00000000..a95c6f5a
--- /dev/null
+++ b/lib/i915/perf-configs/oa-hsw.xml
@@ -0,0 +1,4615 @@
+<?xml version="1.0"?>
+<metrics version="1562317146" merge_md5="">
+  <set name="Render Metrics Basic Gen7.5"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="a490e9d2-55b3-4db0-8dab-53011032c5f3"
+       chipset="HSW"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES EU Stall"
+             description="The percentage of time in which evaluation shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_stall"
+             units="percent"
+             symbol_name="DsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="LLC GPU Accesses"
+             description="The total number of LLC cache lookups done from the GPU (64b reads, 32B writes)."
+             data_type="uint64"
+             equation="PERFCNT1 READ_REG"
+             underscore_name="llc_accesses"
+             units="messages"
+             symbol_name="LlcAccesses"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Alpha Test Fails"
+             description="The total number of pixels dropped on post-FS alpha test."
+             data_type="uint64"
+             equation="A 37 READ"
+             underscore_name="alpha_test_fails"
+             units="pixels"
+             symbol_name="AlphaTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which sampler 1 was bottlenecks."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="TES Threads Dispatched"
+             description="The total number of evaluation shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 15 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="TES AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 12 READ $DsThreads UDIV"
+             underscore_name="ds_eu_active_per_thread"
+             units="cycles"
+             symbol_name="DsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 25 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GS EU Stall"
+             description="The percentage of time in which geometry shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 23 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_stall"
+             units="percent"
+             symbol_name="GsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS EU Active"
+             description="The percentage of time in which compute shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_active"
+             units="percent"
+             symbol_name="CsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS EU Active"
+             description="The percentage of time in which vertex shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 2 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_active"
+             units="percent"
+             symbol_name="VsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS EU Active"
+             description="The percentage of time in which control shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_active"
+             units="percent"
+             symbol_name="HsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES EU Active"
+             description="The percentage of time in which evaluation shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_active"
+             units="percent"
+             symbol_name="DsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS EU Active"
+             description="The percentage of time in which geometry shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 22 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_active"
+             units="percent"
+             symbol_name="GsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 27 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_active"
+             units="percent"
+             symbol_name="PsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS EU Stall"
+             description="The percentage of time in which compute shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_stall"
+             units="percent"
+             symbol_name="CsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 1 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS EU Stall"
+             description="The percentage of time in which vertex shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 3 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_stall"
+             units="percent"
+             symbol_name="VsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS EU Stall"
+             description="The percentage of time in which control shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_stall"
+             units="percent"
+             symbol_name="HsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Stall"
+             description="The percentage of time in which fragment shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 28 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_stall"
+             units="percent"
+             symbol_name="PsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="CS Duration"
+             description="Total Compute Shader GPU duration."
+             data_type="uint64"
+             equation="A 17 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 18 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="cs_duration"
+             units="us"
+             symbol_name="CsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 30 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which sampler 0 was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which sampler 1 was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers were busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ  B 1 READ UADD $GpuCoreClocks FDIV 2 FDIV 100 FMUL"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES Duration"
+             description="Total Evaluation Shader GPU duration."
+             data_type="uint64"
+             equation="A 12 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 13 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="ds_duration"
+             units="us"
+             symbol_name="DsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 1 READ 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 128 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 20 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="CS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 17 READ $CsThreads UDIV"
+             underscore_name="cs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="CsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which sampler 0 was bottlenecks."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 23 READ $GsThreads UDIV"
+             underscore_name="gs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="GsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Sampler 0 Texels LOD0"
+             description="The total number of texels lookups in LOD0 in sampler 0 unit."
+             data_type="uint64"
+             equation="B 4 READ 4 UMUL"
+             underscore_name="sampler0_texels"
+             units="texels"
+             symbol_name="Sampler0Texels"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="Sampler"
+             />
+    <counter name="Sampler 1 Texels LOD0"
+             description="The total number of texels lookups in LOD0 in sampler 1 unit."
+             data_type="uint64"
+             equation="B 5 READ 4 UMUL"
+             underscore_name="sampler1_texels"
+             units="texels"
+             symbol_name="Sampler1Texels"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="Sampler"
+             />
+    <counter name="Sampler Texels LOD0"
+             description="The total number of texels lookups in LOD0 in all sampler units."
+             data_type="uint64"
+             equation="$Sampler0Texels $Sampler1Texels UADD $EuSlicesTotalCount UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="GS Duration"
+             description="Total Geometry Shader GPU duration."
+             data_type="uint64"
+             equation="A 22 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 23 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="gs_duration"
+             units="us"
+             symbol_name="GsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Idle"
+             description="The percentage of time in which the Execution Units were idle."
+             data_type="float"
+             max_equation="100"
+             equation="100 $EuActive $EuStall FADD FSUB"
+             underscore_name="eu_idle"
+             units="percent"
+             symbol_name="EuIdle"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 28 READ $PsThreads UDIV"
+             underscore_name="ps_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="PsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 3 READ $VsThreads UDIV"
+             underscore_name="vs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="VsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="C 5 READ $EuSlicesTotalCount 4 UMUL UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has being processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 41 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 27 READ $PsThreads UDIV"
+             underscore_name="ps_eu_active_per_thread"
+             units="cycles"
+             symbol_name="PsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="TCS Duration"
+             description="Total Control Shader GPU duration."
+             data_type="uint64"
+             equation="A 7 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 8 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="hs_duration"
+             units="us"
+             symbol_name="HsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TES AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 13 READ $DsThreads UDIV"
+             underscore_name="ds_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="DsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="GS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 22 READ $GsThreads UDIV"
+             underscore_name="gs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="GsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS Threads Dispatched"
+             description="The total number of control shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 10 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TCS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 8 READ $HsThreads UDIV"
+             underscore_name="hs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="HsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 36 READ"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Late Depth Test Fails"
+             description="The total number of pixels dropped on post-FS depth test."
+             data_type="uint64"
+             equation="A 39 READ $SamplesKilledInPs USUB"
+             underscore_name="post_ps_depth_test_fails"
+             units="pixels"
+             symbol_name="PostPsDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Sampler Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers were bottlenecks."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 7 READ $HsThreads UDIV"
+             underscore_name="hs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="HsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Duration"
+             description="Total Fragment Shader GPU duration."
+             data_type="uint64"
+             equation="A 27 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 28 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="ps_duration"
+             units="us"
+             symbol_name="PsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 33 READ"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="CS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 18 READ $CsThreads UDIV"
+             underscore_name="cs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="CsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="LLC GPU Hits"
+             description="The total number of successful LLC cache lookups done from the GPU."
+             data_type="uint64"
+             equation="PERFCNT2 READ_REG"
+             underscore_name="llc_hits"
+             units="messages"
+             symbol_name="LlcHits"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Late Stencil Test Fails"
+             description="The total number of pixels dropped on post-FS stencil test."
+             data_type="uint64"
+             equation="A 38 READ"
+             underscore_name="post_ps_stencil_test_fails"
+             units="pixels"
+             symbol_name="PostPsStencilTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="LLC GPU Throughput"
+             description="The total number of GPU memory bytes transferred between GPU and LLC."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="PERFCNT1 READ_REG C 7 READ USUB 64 UMUL"
+             underscore_name="llc_gpu_throughput"
+             units="bytes"
+             symbol_name="LlcGpuThroughput"
+             availability="true $QueryMode &&"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="LLC"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 3 READ 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ UADD 2 UMUL $EuSlicesTotalCount UMUL 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 2 READ $VsThreads UDIV"
+             underscore_name="vs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="VsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Duration"
+             description="Total Vertex Shader GPU duration."
+             data_type="uint64"
+             equation="A 2 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 3 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="vs_duration"
+             units="us"
+             symbol_name="VsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 40 READ"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000253A4" value="0x01600000" />
+        <register type="NOA" address="0x00025440" value="0x00100000" />
+        <register type="NOA" address="0x00025128" value="0x00000000" />
+        <register type="NOA" address="0x0002691C" value="0x00000800" />
+        <register type="NOA" address="0x00026AA0" value="0x01500000" />
+        <register type="NOA" address="0x00026B9C" value="0x00006000" />
+        <register type="NOA" address="0x0002791C" value="0x00000800" />
+        <register type="NOA" address="0x00027AA0" value="0x01500000" />
+        <register type="NOA" address="0x00027B9C" value="0x00006000" />
+        <register type="NOA" address="0x0002641C" value="0x00000400" />
+        <register type="NOA" address="0x00025380" value="0x00000010" />
+        <register type="NOA" address="0x0002538C" value="0x00000000" />
+        <register type="NOA" address="0x00025384" value="0x0800AAAA" />
+        <register type="NOA" address="0x00025400" value="0x00000004" />
+        <register type="NOA" address="0x0002540C" value="0x06029000" />
+        <register type="NOA" address="0x00025410" value="0x00000002" />
+        <register type="NOA" address="0x00025404" value="0x5C30FFFF" />
+        <register type="NOA" address="0x00025100" value="0x00000016" />
+        <register type="NOA" address="0x00025110" value="0x00000400" />
+        <register type="NOA" address="0x00025104" value="0x00000000" />
+        <register type="NOA" address="0x00026804" value="0x00001211" />
+        <register type="NOA" address="0x00026884" value="0x00000100" />
+        <register type="NOA" address="0x00026900" value="0x00000002" />
+        <register type="NOA" address="0x00026908" value="0x00700000" />
+        <register type="NOA" address="0x00026904" value="0x00000000" />
+        <register type="NOA" address="0x00026984" value="0x00001022" />
+        <register type="NOA" address="0x00026A04" value="0x00000011" />
+        <register type="NOA" address="0x00026A80" value="0x00000006" />
+        <register type="NOA" address="0x00026A88" value="0x00000C02" />
+        <register type="NOA" address="0x00026A84" value="0x00000000" />
+        <register type="NOA" address="0x00026B04" value="0x00001000" />
+        <register type="NOA" address="0x00026B80" value="0x00000002" />
+        <register type="NOA" address="0x00026B8C" value="0x00000007" />
+        <register type="NOA" address="0x00026B84" value="0x00000000" />
+        <register type="NOA" address="0x00027804" value="0x00004844" />
+        <register type="NOA" address="0x00027884" value="0x00000400" />
+        <register type="NOA" address="0x00027900" value="0x00000002" />
+        <register type="NOA" address="0x00027908" value="0x0E000000" />
+        <register type="NOA" address="0x00027904" value="0x00000000" />
+        <register type="NOA" address="0x00027984" value="0x00004088" />
+        <register type="NOA" address="0x00027A04" value="0x00000044" />
+        <register type="NOA" address="0x00027A80" value="0x00000006" />
+        <register type="NOA" address="0x00027A88" value="0x00018040" />
+        <register type="NOA" address="0x00027A84" value="0x00000000" />
+        <register type="NOA" address="0x00027B04" value="0x00004000" />
+        <register type="NOA" address="0x00027B80" value="0x00000002" />
+        <register type="NOA" address="0x00027B8C" value="0x000000E0" />
+        <register type="NOA" address="0x00027B84" value="0x00000000" />
+        <register type="NOA" address="0x00026104" value="0x00002222" />
+        <register type="NOA" address="0x00026184" value="0x0C006666" />
+        <register type="NOA" address="0x00026284" value="0x04000000" />
+        <register type="NOA" address="0x00026304" value="0x04000000" />
+        <register type="NOA" address="0x00026400" value="0x00000002" />
+        <register type="NOA" address="0x00026410" value="0x000000A0" />
+        <register type="NOA" address="0x00026404" value="0x00000000" />
+        <register type="NOA" address="0x00025420" value="0x04108020" />
+        <register type="NOA" address="0x00025424" value="0x1284A420" />
+        <register type="NOA" address="0x0002541C" value="0x00000000" />
+        <register type="NOA" address="0x00025428" value="0x00042049" />
+        <register type="NOA" address="0x000091BC" value="0xE0400000" />
+        <register type="NOA" address="0x000091C4" value="0xE4500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0x00800000" /> <!--OASTARTTRIG6 -->
+        <register type="OA" address="0x00002720" value="0x00000000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002714" value="0x00800000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002710" value="0x00000000" /> <!--OASTARTTRIG1 -->
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen7.5"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="b344c8cb-a291-4cbf-aa9c-b40213bfc96f"
+       chipset="HSW"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES EU Stall"
+             description="The percentage of time in which evaluation shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_stall"
+             units="percent"
+             symbol_name="DsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="LLC GPU Accesses"
+             description="The total number of LLC cache lookups done from the GPU (64b reads, 32B writes)."
+             data_type="uint64"
+             equation="PERFCNT1 READ_REG"
+             underscore_name="llc_accesses"
+             units="messages"
+             symbol_name="LlcAccesses"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Alpha Test Fails"
+             description="The total number of pixels dropped on post-FS alpha test."
+             data_type="uint64"
+             equation="A 37 READ"
+             underscore_name="alpha_test_fails"
+             units="pixels"
+             symbol_name="AlphaTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="TCS Threads Dispatched"
+             description="The total number of control shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 10 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TCS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 7 READ $HsThreads UDIV"
+             underscore_name="hs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="HsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 25 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GS EU Stall"
+             description="The percentage of time in which geometry shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 23 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_stall"
+             units="percent"
+             symbol_name="GsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 30 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 20 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="CS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 17 READ $CsThreads UDIV"
+             underscore_name="cs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="CsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 23 READ $GsThreads UDIV"
+             underscore_name="gs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="GsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Typed Atomics"
+             description="The total number of typed atomics."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ UADD $EuSlicesTotalCount UMUL"
+             underscore_name="typed_atomics"
+             units="messages"
+             symbol_name="TypedAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 6 READ C 7 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 28 READ $PsThreads UDIV"
+             underscore_name="ps_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="PsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="TES EU Active"
+             description="The percentage of time in which evaluation shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_active"
+             units="percent"
+             symbol_name="DsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 3 READ $VsThreads UDIV"
+             underscore_name="vs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="VsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="TCS EU Stall"
+             description="The percentage of time in which control shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_stall"
+             units="percent"
+             symbol_name="HsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has being processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 41 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 27 READ $PsThreads UDIV"
+             underscore_name="ps_eu_active_per_thread"
+             units="cycles"
+             symbol_name="PsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="TES Threads Dispatched"
+             description="The total number of evaluation shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 15 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="TES AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 12 READ $DsThreads UDIV"
+             underscore_name="ds_eu_active_per_thread"
+             units="cycles"
+             symbol_name="DsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS EU Active"
+             description="The percentage of time in which geometry shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 22 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_active"
+             units="percent"
+             symbol_name="GsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 27 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_active"
+             units="percent"
+             symbol_name="PsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 13 READ $DsThreads UDIV"
+             underscore_name="ds_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="DsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="GS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 22 READ $GsThreads UDIV"
+             underscore_name="gs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="GsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 2 READ B 3 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of byten written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 8 READ $HsThreads UDIV"
+             underscore_name="hs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="HsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TCS EU Active"
+             description="The percentage of time in which control shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_active"
+             units="percent"
+             symbol_name="HsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 36 READ"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Late Depth Test Fails"
+             description="The total number of pixels dropped on post-FS depth test."
+             data_type="uint64"
+             equation="A 39 READ $SamplesKilledInPs USUB"
+             underscore_name="post_ps_depth_test_fails"
+             units="pixels"
+             symbol_name="PostPsDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="FS EU Stall"
+             description="The percentage of time in which fragment shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 28 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_stall"
+             units="percent"
+             symbol_name="PsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 1 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 33 READ"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS EU Active"
+             description="The percentage of time in which vertex shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 2 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_active"
+             units="percent"
+             symbol_name="VsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS EU Active"
+             description="The percentage of time in which compute shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_active"
+             units="percent"
+             symbol_name="CsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 18 READ $CsThreads UDIV"
+             underscore_name="cs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="CsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="LLC GPU Hits"
+             description="The total number of successful LLC cache lookups done from the GPU."
+             data_type="uint64"
+             equation="PERFCNT2 READ_REG"
+             underscore_name="llc_hits"
+             units="messages"
+             symbol_name="LlcHits"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Late Stencil Test Fails"
+             description="The total number of pixels dropped on post-FS stencil test."
+             data_type="uint64"
+             equation="A 38 READ"
+             underscore_name="post_ps_stencil_test_fails"
+             units="pixels"
+             symbol_name="PostPsStencilTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="VS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 2 READ $VsThreads UDIV"
+             underscore_name="vs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="VsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS EU Stall"
+             description="The percentage of time in which compute shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_stall"
+             units="percent"
+             symbol_name="CsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 4 READ B 5 READ UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 40 READ"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="VS EU Stall"
+             description="The percentage of time in which vertex shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 3 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_stall"
+             units="percent"
+             symbol_name="VsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000253A4" value="0x00000000" />
+        <register type="NOA" address="0x0002681C" value="0x01F00800" />
+        <register type="NOA" address="0x00026820" value="0x00001000" />
+        <register type="NOA" address="0x0002781C" value="0x01F00800" />
+        <register type="NOA" address="0x00026520" value="0x00000007" />
+        <register type="NOA" address="0x000265A0" value="0x00000007" />
+        <register type="NOA" address="0x00025380" value="0x00000010" />
+        <register type="NOA" address="0x0002538C" value="0x00300000" />
+        <register type="NOA" address="0x00025384" value="0xAA8AAAAA" />
+        <register type="NOA" address="0x00025404" value="0xFFFFFFFF" />
+        <register type="NOA" address="0x00026800" value="0x00004202" />
+        <register type="NOA" address="0x00026808" value="0x00605817" />
+        <register type="NOA" address="0x0002680C" value="0x10001005" />
+        <register type="NOA" address="0x00026804" value="0x00000000" />
+        <register type="NOA" address="0x00027800" value="0x00000102" />
+        <register type="NOA" address="0x00027808" value="0x0C0701E0" />
+        <register type="NOA" address="0x0002780C" value="0x000200A0" />
+        <register type="NOA" address="0x00027804" value="0x00000000" />
+        <register type="NOA" address="0x00026484" value="0x44000000" />
+        <register type="NOA" address="0x00026704" value="0x44000000" />
+        <register type="NOA" address="0x00026500" value="0x00000006" />
+        <register type="NOA" address="0x00026510" value="0x00000001" />
+        <register type="NOA" address="0x00026504" value="0x88000000" />
+        <register type="NOA" address="0x00026580" value="0x00000006" />
+        <register type="NOA" address="0x00026590" value="0x00000020" />
+        <register type="NOA" address="0x00026584" value="0x00000000" />
+        <register type="NOA" address="0x00026104" value="0x55822222" />
+        <register type="NOA" address="0x00026184" value="0xAA866666" />
+        <register type="NOA" address="0x00025420" value="0x08320C83" />
+        <register type="NOA" address="0x00025424" value="0x06820C83" />
+        <register type="NOA" address="0x0002541C" value="0x00000000" />
+        <register type="NOA" address="0x00025428" value="0x00000C03" />
+        <register type="NOA" address="0x000091BC" value="0xE0400000" />
+        <register type="NOA" address="0x000091C4" value="0xE4500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002714" value="0x00800000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002718" value="0xAAAAAAAA" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x0000271C" value="0xAAAAAAAA" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002720" value="0x00000000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002724" value="0x00800000" /> <!--OASTARTTRIG6 -->
+        <register type="OA" address="0x00002728" value="0xAAAAAAAA" /> <!--OASTARTTRIG7 -->
+        <register type="OA" address="0x0000272C" value="0xAAAAAAAA" /> <!--OASTARTTRIG8 -->
+        <register type="OA" address="0x00002740" value="0x00000000" /> <!--OAREPORTTRIG1 -->
+        <register type="OA" address="0x00002744" value="0x00000000" /> <!--OAREPORTTRIG2 -->
+        <register type="OA" address="0x00002748" value="0x00000000" /> <!--OAREPORTTRIG3 -->
+        <register type="OA" address="0x0000274C" value="0x00000000" /> <!--OAREPORTTRIG4 -->
+        <register type="OA" address="0x00002750" value="0x00000000" /> <!--OAREPORTTRIG5 -->
+        <register type="OA" address="0x00002754" value="0x00000000" /> <!--OAREPORTTRIG6 -->
+        <register type="OA" address="0x00002758" value="0x00000000" /> <!--OAREPORTTRIG7 -->
+        <register type="OA" address="0x0000275C" value="0x00000000" /> <!--OAREPORTTRIG8 -->
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen7.5"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="480f9795-cf6a-4204-a9e3-cd7015515f8d"
+       chipset="HSW"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="LLC GPU Accesses"
+             description="The total number of LLC cache lookups done from the GPU (64b reads, 32B writes)."
+             data_type="uint64"
+             equation="PERFCNT1 READ_REG"
+             underscore_name="llc_accesses"
+             units="messages"
+             symbol_name="LlcAccesses"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gpu_clocks"
+             units="cycles"
+             symbol_name="GpuClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 20 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="LLC GPU Hits"
+             description="The total number of successful LLC cache lookups done from the GPU."
+             data_type="uint64"
+             equation="PERFCNT2 READ_REG"
+             underscore_name="llc_hits"
+             units="messages"
+             symbol_name="LlcHits"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUrbAtomics0"
+             description="The subslice 0 EU URB Atomics subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_urb_atomics0"
+             units="messages"
+             symbol_name="EuUrbAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x0002681C" value="0x3EB00800" />
+        <register type="NOA" address="0x00026820" value="0x00900000" />
+        <register type="NOA" address="0x00025384" value="0x02AAAAAA" />
+        <register type="NOA" address="0x00025404" value="0x03FFFFFF" />
+        <register type="NOA" address="0x00026800" value="0x00142284" />
+        <register type="NOA" address="0x00026808" value="0x0E629062" />
+        <register type="NOA" address="0x0002680C" value="0x3F6F55CB" />
+        <register type="NOA" address="0x00026810" value="0x00000014" />
+        <register type="NOA" address="0x00026804" value="0x00000000" />
+        <register type="NOA" address="0x00026104" value="0x02AAAAAA" />
+        <register type="NOA" address="0x00026184" value="0x02AAAAAA" />
+        <register type="NOA" address="0x00025420" value="0x00000000" />
+        <register type="NOA" address="0x00025424" value="0x00000000" />
+        <register type="NOA" address="0x0002541C" value="0x00000000" />
+        <register type="NOA" address="0x00025428" value="0x00000000" />
+        <register type="NOA" address="0x000091BC" value="0xE0400000" />
+        <register type="NOA" address="0x000091C4" value="0xE4500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" /> <!--OASTARTTRIG6 -->
+        <register type="OA" address="0x00002720" value="0x00000000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002714" value="0xF0800000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002710" value="0x00000000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002770" value="0x0007FE2A" /> <!--OACEC0_0 -->
+        <register type="OA" address="0x00002774" value="0x0000FF00" /> <!--OACEC0_1 -->
+        <register type="OA" address="0x00002778" value="0x0007FE6A" /> <!--OACEC1_0 -->
+        <register type="OA" address="0x0000277C" value="0x0000FF00" /> <!--OACEC1_1 -->
+        <register type="OA" address="0x00002780" value="0x0007FE92" /> <!--OACEC2_0 -->
+        <register type="OA" address="0x00002784" value="0x0000FF00" /> <!--OACEC2_1 -->
+        <register type="OA" address="0x00002788" value="0x0007FEA2" /> <!--OACEC3_0 -->
+        <register type="OA" address="0x0000278C" value="0x0000FF00" /> <!--OACEC3_1 -->
+        <register type="OA" address="0x00002790" value="0x0007FE32" /> <!--OACEC4_0 -->
+        <register type="OA" address="0x00002794" value="0x0000FF00" /> <!--OACEC4_1 -->
+        <register type="OA" address="0x00002798" value="0x0007FE9A" /> <!--OACEC5_0 -->
+        <register type="OA" address="0x0000279C" value="0x0000FF00" /> <!--OACEC5_1 -->
+        <register type="OA" address="0x000027A0" value="0x0007FF23" /> <!--OACEC6_0 -->
+        <register type="OA" address="0x000027A4" value="0x0000FF00" /> <!--OACEC6_1 -->
+        <register type="OA" address="0x000027A8" value="0x0007FFF3" /> <!--OACEC7_0 -->
+        <register type="OA" address="0x000027AC" value="0x0000FFFE" /> <!--OACEC7_1 -->
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen7.5"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="399d3001-97d6-4240-b065-4fb843138e17"
+       chipset="HSW"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES EU Stall"
+             description="The percentage of time in which evaluation shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_stall"
+             units="percent"
+             symbol_name="DsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="LLC GPU Accesses"
+             description="The total number of LLC cache lookups done from the GPU (64b reads, 32B writes)."
+             data_type="uint64"
+             equation="PERFCNT1 READ_REG"
+             underscore_name="llc_accesses"
+             units="messages"
+             symbol_name="LlcAccesses"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Alpha Test Fails"
+             description="The total number of pixels dropped on post-FS alpha test."
+             data_type="uint64"
+             equation="A 37 READ"
+             underscore_name="alpha_test_fails"
+             units="pixels"
+             symbol_name="AlphaTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="TES Threads Dispatched"
+             description="The total number of evaluation shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 15 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="TES AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 12 READ $DsThreads UDIV"
+             underscore_name="ds_eu_active_per_thread"
+             units="cycles"
+             symbol_name="DsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 25 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GS EU Stall"
+             description="The percentage of time in which geometry shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 23 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_stall"
+             units="percent"
+             symbol_name="GsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="LLC GPU Read Accesses"
+             description="The total number of LLC cache lookups for reads done from the GPU."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="llc_read_accesses"
+             units="messages"
+             symbol_name="LlcReadAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 30 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads (64B each)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 20 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="CS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 17 READ $CsThreads UDIV"
+             underscore_name="cs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="CsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 23 READ $GsThreads UDIV"
+             underscore_name="gs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="GsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="FS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 28 READ $PsThreads UDIV"
+             underscore_name="ps_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="PsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="TES EU Active"
+             description="The percentage of time in which evaluation shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_active"
+             units="percent"
+             symbol_name="DsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 3 READ $VsThreads UDIV"
+             underscore_name="vs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="VsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="TCS EU Stall"
+             description="The percentage of time in which control shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_stall"
+             units="percent"
+             symbol_name="HsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has being processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 41 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 27 READ $PsThreads UDIV"
+             underscore_name="ps_eu_active_per_thread"
+             units="cycles"
+             symbol_name="PsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GS EU Active"
+             description="The percentage of time in which geometry shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 22 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_active"
+             units="percent"
+             symbol_name="GsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 27 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_active"
+             units="percent"
+             symbol_name="PsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 13 READ $DsThreads UDIV"
+             underscore_name="ds_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="DsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="GS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 22 READ $GsThreads UDIV"
+             underscore_name="gs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="GsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiHiDepthMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hi_depth_memory_reads"
+             units="messages"
+             symbol_name="GtiHiDepthMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="TCS Threads Dispatched"
+             description="The total number of control shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 10 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TCS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 8 READ $HsThreads UDIV"
+             underscore_name="hs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="HsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TCS EU Active"
+             description="The percentage of time in which control shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_active"
+             units="percent"
+             symbol_name="HsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 36 READ"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Late Depth Test Fails"
+             description="The total number of pixels dropped on post-FS depth test."
+             data_type="uint64"
+             equation="A 39 READ $SamplesKilledInPs USUB"
+             underscore_name="post_ps_depth_test_fails"
+             units="pixels"
+             symbol_name="PostPsDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="TCS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 7 READ $HsThreads UDIV"
+             underscore_name="hs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="HsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Stall"
+             description="The percentage of time in which fragment shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 28 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_stall"
+             units="percent"
+             symbol_name="PsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 1 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 33 READ"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS EU Active"
+             description="The percentage of time in which vertex shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 2 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_active"
+             units="percent"
+             symbol_name="VsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS EU Active"
+             description="The percentage of time in which compute shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_active"
+             units="percent"
+             symbol_name="CsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 18 READ $CsThreads UDIV"
+             underscore_name="cs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="CsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="LLC GPU Hits"
+             description="The total number of successful LLC cache lookups done from the GPU."
+             data_type="uint64"
+             equation="PERFCNT2 READ_REG"
+             underscore_name="llc_hits"
+             units="messages"
+             symbol_name="LlcHits"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="Late Stencil Test Fails"
+             description="The total number of pixels dropped on post-FS stencil test."
+             data_type="uint64"
+             equation="A 38 READ"
+             underscore_name="post_ps_stencil_test_fails"
+             units="pixels"
+             symbol_name="PostPsStencilTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="VS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 2 READ $VsThreads UDIV"
+             underscore_name="vs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="VsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="CS EU Stall"
+             description="The percentage of time in which compute shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_stall"
+             units="percent"
+             symbol_name="CsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 40 READ"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="VS EU Stall"
+             description="The percentage of time in which vertex shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 3 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_stall"
+             units="percent"
+             symbol_name="VsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000253A4" value="0x34300000" />
+        <register type="NOA" address="0x00025440" value="0x2D800000" />
+        <register type="NOA" address="0x00025444" value="0x00000008" />
+        <register type="NOA" address="0x00025128" value="0x0E600000" />
+        <register type="NOA" address="0x00025380" value="0x00000450" />
+        <register type="NOA" address="0x00025390" value="0x00052C43" />
+        <register type="NOA" address="0x00025384" value="0x00000000" />
+        <register type="NOA" address="0x00025400" value="0x00006144" />
+        <register type="NOA" address="0x00025408" value="0x0A418820" />
+        <register type="NOA" address="0x0002540C" value="0x000820E6" />
+        <register type="NOA" address="0x00025404" value="0xFF500000" />
+        <register type="NOA" address="0x00025100" value="0x000005D6" />
+        <register type="NOA" address="0x0002510C" value="0x0EF00000" />
+        <register type="NOA" address="0x00025104" value="0x00000000" />
+        <register type="NOA" address="0x00025420" value="0x02108421" />
+        <register type="NOA" address="0x00025424" value="0x00008421" />
+        <register type="NOA" address="0x0002541C" value="0x00000000" />
+        <register type="NOA" address="0x00025428" value="0x00000000" />
+        <register type="NOA" address="0x000091BC" value="0xE0400000" />
+        <register type="NOA" address="0x000091C4" value="0xE4500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" /> <!--OASTARTTRIG6 -->
+        <register type="OA" address="0x00002720" value="0x00000000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002714" value="0xF0800000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002710" value="0x00000000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x0000274C" value="0x76543298" /> <!--OAREPORTTRIG4 -->
+        <register type="OA" address="0x00002748" value="0x98989898" /> <!--OAREPORTTRIG3 -->
+        <register type="OA" address="0x00002744" value="0x000000E4" /> <!--OAREPORTTRIG2 -->
+        <register type="OA" address="0x00002740" value="0x00000000" /> <!--OAREPORTTRIG1 -->
+        <register type="OA" address="0x0000275C" value="0x98A98A98" /> <!--OAREPORTTRIG8 -->
+        <register type="OA" address="0x00002758" value="0x88888888" /> <!--OAREPORTTRIG7 -->
+        <register type="OA" address="0x00002754" value="0x000C5500" /> <!--OAREPORTTRIG6 -->
+        <register type="OA" address="0x00002750" value="0x00000000" /> <!--OAREPORTTRIG5 -->
+        <register type="OA" address="0x00002770" value="0x0007F81A" /> <!--OACEC0_0 -->
+        <register type="OA" address="0x00002774" value="0x0000FC00" /> <!--OACEC0_1 -->
+        <register type="OA" address="0x00002778" value="0x0007F82A" /> <!--OACEC1_0 -->
+        <register type="OA" address="0x0000277C" value="0x0000FC00" /> <!--OACEC1_1 -->
+        <register type="OA" address="0x00002780" value="0x0007F872" /> <!--OACEC2_0 -->
+        <register type="OA" address="0x00002784" value="0x0000FC00" /> <!--OACEC2_1 -->
+        <register type="OA" address="0x00002788" value="0x0007F8BA" /> <!--OACEC3_0 -->
+        <register type="OA" address="0x0000278C" value="0x0000FC00" /> <!--OACEC3_1 -->
+        <register type="OA" address="0x00002790" value="0x0007F87A" /> <!--OACEC4_0 -->
+        <register type="OA" address="0x00002794" value="0x0000FC00" /> <!--OACEC4_1 -->
+        <register type="OA" address="0x00002798" value="0x0007F8EA" /> <!--OACEC5_0 -->
+        <register type="OA" address="0x0000279C" value="0x0000FC00" /> <!--OACEC5_1 -->
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" /> <!--OACEC6_0 -->
+        <register type="OA" address="0x000027A4" value="0x0000FC00" /> <!--OACEC6_1 -->
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" /> <!--OACEC7_0 -->
+        <register type="OA" address="0x000027AC" value="0x0000FC00" /> <!--OACEC7_1 -->
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen7.5"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="f3c1ff4b-d0da-4ffa-8780-2c6b98f3f2d5"
+       chipset="HSW"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES EU Stall"
+             description="The percentage of time in which evaluation shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_stall"
+             units="percent"
+             symbol_name="DsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="LLC GPU Accesses"
+             description="The total number of LLC cache lookups done from the GPU (64b reads, 32B writes)."
+             data_type="uint64"
+             equation="PERFCNT1 READ_REG"
+             underscore_name="llc_accesses"
+             units="messages"
+             symbol_name="LlcAccesses"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Alpha Test Fails"
+             description="The total number of pixels dropped on post-FS alpha test."
+             data_type="uint64"
+             equation="A 37 READ"
+             underscore_name="alpha_test_fails"
+             units="pixels"
+             symbol_name="AlphaTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="TES Threads Dispatched"
+             description="The total number of evaluation shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 15 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="TES AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 12 READ $DsThreads UDIV"
+             underscore_name="ds_eu_active_per_thread"
+             units="cycles"
+             symbol_name="DsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 25 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GS EU Stall"
+             description="The percentage of time in which geometry shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 23 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_stall"
+             units="percent"
+             symbol_name="GsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 30 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 20 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="CS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 17 READ $CsThreads UDIV"
+             underscore_name="cs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="CsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 23 READ $GsThreads UDIV"
+             underscore_name="gs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="GsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 28 READ $PsThreads UDIV"
+             underscore_name="ps_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="PsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="TES EU Active"
+             description="The percentage of time in which evaluation shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_active"
+             units="percent"
+             symbol_name="DsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 3 READ $VsThreads UDIV"
+             underscore_name="vs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="VsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="TCS EU Stall"
+             description="The percentage of time in which control shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_stall"
+             units="percent"
+             symbol_name="HsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has being processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 41 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 27 READ $PsThreads UDIV"
+             underscore_name="ps_eu_active_per_thread"
+             units="cycles"
+             symbol_name="PsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="LLC GPU Write Accesses"
+             description="The total number of LLC cache lookups for write done from the GPU (32B writes)."
+             data_type="uint64"
+             equation="C 6 READ 2 UMUL"
+             underscore_name="llc_wr_accesses"
+             units="messages"
+             symbol_name="LlcWrAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="GS EU Active"
+             description="The percentage of time in which geometry shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 22 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_active"
+             units="percent"
+             symbol_name="GsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 27 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_active"
+             units="percent"
+             symbol_name="PsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="TES AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 13 READ $DsThreads UDIV"
+             underscore_name="ds_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="DsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="GS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 22 READ $GsThreads UDIV"
+             underscore_name="gs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="GsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS Threads Dispatched"
+             description="The total number of control shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 10 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TCS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 8 READ $HsThreads UDIV"
+             underscore_name="hs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="HsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TCS EU Active"
+             description="The percentage of time in which control shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_active"
+             units="percent"
+             symbol_name="HsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 36 READ"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Late Depth Test Fails"
+             description="The total number of pixels dropped on post-FS depth test."
+             data_type="uint64"
+             equation="A 39 READ $SamplesKilledInPs USUB"
+             underscore_name="post_ps_depth_test_fails"
+             units="pixels"
+             symbol_name="PostPsDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="TCS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 7 READ $HsThreads UDIV"
+             underscore_name="hs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="HsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Stall"
+             description="The percentage of time in which fragment shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 28 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_stall"
+             units="percent"
+             symbol_name="PsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 1 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 33 READ"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS EU Active"
+             description="The percentage of time in which vertex shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 2 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_active"
+             units="percent"
+             symbol_name="VsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS EU Active"
+             description="The percentage of time in which compute shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_active"
+             units="percent"
+             symbol_name="CsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 18 READ $CsThreads UDIV"
+             underscore_name="cs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="CsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="LLC GPU Hits"
+             description="The total number of successful LLC cache lookups done from the GPU."
+             data_type="uint64"
+             equation="PERFCNT2 READ_REG"
+             underscore_name="llc_hits"
+             units="messages"
+             symbol_name="LlcHits"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Late Stencil Test Fails"
+             description="The total number of pixels dropped on post-FS stencil test."
+             data_type="uint64"
+             equation="A 38 READ"
+             underscore_name="post_ps_stencil_test_fails"
+             units="pixels"
+             symbol_name="PostPsStencilTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="LLC GPU Throughput"
+             description="The total number of GPU memory bytes transferred between GPU and LLC."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="PERFCNT1 READ_REG $LlcWrAccesses USUB 64 UMUL $LlcWrAccesses 32 UMUL UADD"
+             underscore_name="llc_gpu_throughput"
+             units="bytes"
+             symbol_name="LlcGpuThroughput"
+             availability="true $QueryMode &&"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="LLC"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="VS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 2 READ $VsThreads UDIV"
+             underscore_name="vs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="VsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="CS EU Stall"
+             description="The percentage of time in which compute shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_stall"
+             units="percent"
+             symbol_name="CsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 40 READ"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes (64B each)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="VS EU Stall"
+             description="The percentage of time in which vertex shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 3 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_stall"
+             units="percent"
+             symbol_name="VsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000253A4" value="0x34300000" />
+        <register type="NOA" address="0x00025440" value="0x01500000" />
+        <register type="NOA" address="0x00025444" value="0x00000120" />
+        <register type="NOA" address="0x00025128" value="0x0C200000" />
+        <register type="NOA" address="0x00025380" value="0x00000450" />
+        <register type="NOA" address="0x00025390" value="0x00052C43" />
+        <register type="NOA" address="0x00025384" value="0x00000000" />
+        <register type="NOA" address="0x00025400" value="0x00007184" />
+        <register type="NOA" address="0x00025408" value="0x0A418820" />
+        <register type="NOA" address="0x0002540C" value="0x000820E6" />
+        <register type="NOA" address="0x00025404" value="0xFF500000" />
+        <register type="NOA" address="0x00025100" value="0x000005D6" />
+        <register type="NOA" address="0x0002510C" value="0x1E700000" />
+        <register type="NOA" address="0x00025104" value="0x00000000" />
+        <register type="NOA" address="0x00025420" value="0x02108421" />
+        <register type="NOA" address="0x00025424" value="0x00008421" />
+        <register type="NOA" address="0x0002541C" value="0x00000000" />
+        <register type="NOA" address="0x00025428" value="0x00000000" />
+        <register type="NOA" address="0x000091BC" value="0xE0400000" />
+        <register type="NOA" address="0x000091C4" value="0xE4500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" /> <!--OASTARTTRIG6 -->
+        <register type="OA" address="0x00002720" value="0x00000000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002714" value="0xF0800000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002710" value="0x00000000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x0000274C" value="0x76543298" /> <!--OAREPORTTRIG4 -->
+        <register type="OA" address="0x00002748" value="0x98989898" /> <!--OAREPORTTRIG3 -->
+        <register type="OA" address="0x00002744" value="0x000000E4" /> <!--OAREPORTTRIG2 -->
+        <register type="OA" address="0x00002740" value="0x00000000" /> <!--OAREPORTTRIG1 -->
+        <register type="OA" address="0x0000275C" value="0xBABABABA" /> <!--OAREPORTTRIG8 -->
+        <register type="OA" address="0x00002758" value="0x88888888" /> <!--OAREPORTTRIG7 -->
+        <register type="OA" address="0x00002754" value="0x000C5500" /> <!--OAREPORTTRIG6 -->
+        <register type="OA" address="0x00002750" value="0x00000000" /> <!--OAREPORTTRIG5 -->
+        <register type="OA" address="0x00002770" value="0x0007F81A" /> <!--OACEC0_0 -->
+        <register type="OA" address="0x00002774" value="0x0000FC00" /> <!--OACEC0_1 -->
+        <register type="OA" address="0x00002778" value="0x0007F82A" /> <!--OACEC1_0 -->
+        <register type="OA" address="0x0000277C" value="0x0000FC00" /> <!--OACEC1_1 -->
+        <register type="OA" address="0x00002780" value="0x0007F822" /> <!--OACEC2_0 -->
+        <register type="OA" address="0x00002784" value="0x0000FC00" /> <!--OACEC2_1 -->
+        <register type="OA" address="0x00002788" value="0x0007F8BA" /> <!--OACEC3_0 -->
+        <register type="OA" address="0x0000278C" value="0x0000FC00" /> <!--OACEC3_1 -->
+        <register type="OA" address="0x00002790" value="0x0007F87A" /> <!--OACEC4_0 -->
+        <register type="OA" address="0x00002794" value="0x0000FC00" /> <!--OACEC4_1 -->
+        <register type="OA" address="0x00002798" value="0x0007F8EA" /> <!--OACEC5_0 -->
+        <register type="OA" address="0x0000279C" value="0x0000FC00" /> <!--OACEC5_1 -->
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" /> <!--OACEC6_0 -->
+        <register type="OA" address="0x000027A4" value="0x0000FC00" /> <!--OACEC6_1 -->
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" /> <!--OACEC7_0 -->
+        <register type="OA" address="0x000027AC" value="0x0000FC00" /> <!--OACEC7_1 -->
+    </register_config>
+  </set>
+
+  <set name="Metric set SamplerBalance"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler_balance"
+       hw_config_guid="e111cda4-19c3-41ee-b326-f99ac44ebf78"
+       chipset="HSW"
+       symbol_name="SamplerBalance"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES EU Stall"
+             description="The percentage of time in which evaluation shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_stall"
+             units="percent"
+             symbol_name="DsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="LLC GPU Accesses"
+             description="The total number of LLC cache lookups done from the GPU (64b reads, 32B writes)."
+             data_type="uint64"
+             equation="PERFCNT1 READ_REG"
+             underscore_name="llc_accesses"
+             units="messages"
+             symbol_name="LlcAccesses"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Sampler L2 cache misses (ss3)"
+             description="Number of sampler L2 cache misses (ss3)"
+             data_type="uint64"
+             equation="C 1 READ C 0 READ UADD"
+             underscore_name="sampler3_l2_cache_misses"
+             units="messages"
+             symbol_name="Sampler3L2CacheMisses"
+             availability="$SubsliceMask 0x8 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="Alpha Test Fails"
+             description="The total number of pixels dropped on post-FS alpha test."
+             data_type="uint64"
+             equation="A 37 READ"
+             underscore_name="alpha_test_fails"
+             units="pixels"
+             symbol_name="AlphaTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="TES Threads Dispatched"
+             description="The total number of evaluation shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 15 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="TES AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 12 READ $DsThreads UDIV"
+             underscore_name="ds_eu_active_per_thread"
+             units="cycles"
+             symbol_name="DsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 25 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GS EU Stall"
+             description="The percentage of time in which geometry shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 23 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_stall"
+             units="percent"
+             symbol_name="GsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS EU Active"
+             description="The percentage of time in which compute shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_active"
+             units="percent"
+             symbol_name="CsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS EU Active"
+             description="The percentage of time in which vertex shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 2 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_active"
+             units="percent"
+             symbol_name="VsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS EU Active"
+             description="The percentage of time in which control shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_active"
+             units="percent"
+             symbol_name="HsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TES EU Active"
+             description="The percentage of time in which evaluation shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_eu_active"
+             units="percent"
+             symbol_name="DsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Evaluation Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS EU Active"
+             description="The percentage of time in which geometry shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 22 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_eu_active"
+             units="percent"
+             symbol_name="GsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 27 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_active"
+             units="percent"
+             symbol_name="PsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS EU Stall"
+             description="The percentage of time in which compute shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cs_eu_stall"
+             units="percent"
+             symbol_name="CsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 1 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS EU Stall"
+             description="The percentage of time in which vertex shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 3 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_stall"
+             units="percent"
+             symbol_name="VsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS EU Stall"
+             description="The percentage of time in which control shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_eu_stall"
+             units="percent"
+             symbol_name="HsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS EU Stall"
+             description="The percentage of time in which fragment shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 28 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_stall"
+             units="percent"
+             symbol_name="PsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="CS Duration"
+             description="Total Compute Shader GPU duration."
+             data_type="uint64"
+             equation="A 17 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 18 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="cs_duration"
+             units="us"
+             symbol_name="CsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 30 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="TES Duration"
+             description="Total Evaluation Shader GPU duration."
+             data_type="uint64"
+             equation="A 12 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 13 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="ds_duration"
+             units="us"
+             symbol_name="DsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="GS Duration"
+             description="Total Geometry Shader GPU duration."
+             data_type="uint64"
+             equation="A 22 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 23 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="gs_duration"
+             units="us"
+             symbol_name="GsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 20 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="CS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 17 READ $CsThreads UDIV"
+             underscore_name="cs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="CsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="EU Array/Compute Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler L2 cache misses"
+             description="Number of sampler L2 cache misses"
+             data_type="uint64"
+             equation="C 7 READ C 6 READ UADD C 5 READ UADD C 4 READ UADD C 3 READ UADD C 2 READ UADD C 1 READ UADD C 0 READ UADD"
+             underscore_name="sampler_l2_cache_misses"
+             units="messages"
+             symbol_name="SamplerL2CacheMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="GS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 23 READ $GsThreads UDIV"
+             underscore_name="gs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="GsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Sampler L2 cache misses (ss2)"
+             description="Number of sampler L2 cache misses (ss2)"
+             data_type="uint64"
+             equation="C 3 READ C 2 READ UADD"
+             underscore_name="sampler2_l2_cache_misses"
+             units="messages"
+             symbol_name="Sampler2L2CacheMisses"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Idle"
+             description="The percentage of time in which the Execution Units were idle."
+             data_type="float"
+             max_equation="100"
+             equation="100 $EuActive $EuStall FADD FSUB"
+             underscore_name="eu_idle"
+             units="percent"
+             symbol_name="EuIdle"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 28 READ $PsThreads UDIV"
+             underscore_name="ps_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="PsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="VS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 3 READ $VsThreads UDIV"
+             underscore_name="vs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="VsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has being processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 41 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 27 READ $PsThreads UDIV"
+             underscore_name="ps_eu_active_per_thread"
+             units="cycles"
+             symbol_name="PsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="TCS Duration"
+             description="Total Control Shader GPU duration."
+             data_type="uint64"
+             equation="A 7 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 8 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="hs_duration"
+             units="us"
+             symbol_name="HsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TES AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which evaluation shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 13 READ $DsThreads UDIV"
+             underscore_name="ds_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="DsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Evaluation Shader"
+             />
+    <counter name="GS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which geometry shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 22 READ $GsThreads UDIV"
+             underscore_name="gs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="GsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TCS Threads Dispatched"
+             description="The total number of control shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 10 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="TCS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 8 READ $HsThreads UDIV"
+             underscore_name="hs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="HsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Control Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 36 READ"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Late Depth Test Fails"
+             description="The total number of pixels dropped on post-FS depth test."
+             data_type="uint64"
+             equation="A 39 READ $SamplesKilledInPs USUB"
+             underscore_name="post_ps_depth_test_fails"
+             units="pixels"
+             symbol_name="PostPsDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="TCS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which control shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 7 READ $HsThreads UDIV"
+             underscore_name="hs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="HsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Control Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Duration"
+             description="Total Fragment Shader GPU duration."
+             data_type="uint64"
+             equation="A 27 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 28 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="ps_duration"
+             units="us"
+             symbol_name="PsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler L2 cache misses (ss1)"
+             description="Number of sampler L2 cache misses (ss1)"
+             data_type="uint64"
+             equation="C 5 READ C 4 READ UADD"
+             underscore_name="sampler1_l2_cache_misses"
+             units="messages"
+             symbol_name="Sampler1L2CacheMisses"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 33 READ"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="CS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which compute shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 18 READ $CsThreads UDIV"
+             underscore_name="cs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="CsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="LLC GPU Hits"
+             description="The total number of successful LLC cache lookups done from the GPU."
+             data_type="uint64"
+             equation="PERFCNT2 READ_REG"
+             underscore_name="llc_hits"
+             units="messages"
+             symbol_name="LlcHits"
+             availability="true $QueryMode &&"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="LLC"
+             />
+    <counter name="Late Stencil Test Fails"
+             description="The total number of pixels dropped on post-FS stencil test."
+             data_type="uint64"
+             equation="A 38 READ"
+             underscore_name="post_ps_stencil_test_fails"
+             units="pixels"
+             symbol_name="PostPsStencilTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Sampler L2 cache misses (ss0)"
+             description="Number of sampler L2 cache misses (ss0)"
+             data_type="uint64"
+             equation="C 7 READ C 6 READ UADD"
+             underscore_name="sampler0_l2_cache_misses"
+             units="messages"
+             symbol_name="Sampler0L2CacheMisses"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were processed actively on the EUs."
+             data_type="uint64"
+             max_equation="100"
+             equation="A 2 READ $VsThreads UDIV"
+             underscore_name="vs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="VsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Duration"
+             description="Total Vertex Shader GPU duration."
+             data_type="uint64"
+             equation="A 2 READ  A 0 READ UMUL  A 2 READ  A 7 READ UADD  A 12 READ UADD  A 17 READ UADD  A 22 READ UADD  A 27 READ UADD UDIV  A 3 READ  A 1 READ UMUL  A 3 READ  A 8 READ UADD  A 13 READ UADD  A 18 READ UADD  A 23 READ UADD  A 28 READ UADD UDIV UADD $GpuTime UMUL $GpuCoreClocks $EuCoresTotalCount UMUL 1000 UMUL UDIV"
+             underscore_name="vs_duration"
+             units="us"
+             symbol_name="VsDuration"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 40 READ"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x0002EB9C" value="0x01906400" />
+        <register type="NOA" address="0x0002FB9C" value="0x01906400" />
+        <register type="NOA" address="0x000253A4" value="0x00000000" />
+        <register type="NOA" address="0x00026B9C" value="0x01906400" />
+        <register type="NOA" address="0x00027B9C" value="0x01906400" />
+        <register type="NOA" address="0x00027104" value="0x00A00000" />
+        <register type="NOA" address="0x00027184" value="0x00A50000" />
+        <register type="NOA" address="0x0002E804" value="0x00500000" />
+        <register type="NOA" address="0x0002E984" value="0x00500000" />
+        <register type="NOA" address="0x0002EB04" value="0x00500000" />
+        <register type="NOA" address="0x0002EB80" value="0x00000084" />
+        <register type="NOA" address="0x0002EB8C" value="0x14200000" />
+        <register type="NOA" address="0x0002EB84" value="0x00000000" />
+        <register type="NOA" address="0x0002F804" value="0x00050000" />
+        <register type="NOA" address="0x0002F984" value="0x00050000" />
+        <register type="NOA" address="0x0002FB04" value="0x00050000" />
+        <register type="NOA" address="0x0002FB80" value="0x00000084" />
+        <register type="NOA" address="0x0002FB8C" value="0x00050800" />
+        <register type="NOA" address="0x0002FB84" value="0x00000000" />
+        <register type="NOA" address="0x00025380" value="0x00000010" />
+        <register type="NOA" address="0x0002538C" value="0x000000C0" />
+        <register type="NOA" address="0x00025384" value="0xAA550000" />
+        <register type="NOA" address="0x00025404" value="0xFFFFC000" />
+        <register type="NOA" address="0x00026804" value="0x50000000" />
+        <register type="NOA" address="0x00026984" value="0x50000000" />
+        <register type="NOA" address="0x00026B04" value="0x50000000" />
+        <register type="NOA" address="0x00026B80" value="0x00000084" />
+        <register type="NOA" address="0x00026B90" value="0x00050800" />
+        <register type="NOA" address="0x00026B84" value="0x00000000" />
+        <register type="NOA" address="0x00027804" value="0x05000000" />
+        <register type="NOA" address="0x00027984" value="0x05000000" />
+        <register type="NOA" address="0x00027B04" value="0x05000000" />
+        <register type="NOA" address="0x00027B80" value="0x00000084" />
+        <register type="NOA" address="0x00027B90" value="0x00000142" />
+        <register type="NOA" address="0x00027B84" value="0x00000000" />
+        <register type="NOA" address="0x00026104" value="0xA0000000" />
+        <register type="NOA" address="0x00026184" value="0xA5000000" />
+        <register type="NOA" address="0x00025424" value="0x00008620" />
+        <register type="NOA" address="0x0002541C" value="0x00000000" />
+        <register type="NOA" address="0x00025428" value="0x0004A54A" />
+        <register type="NOA" address="0x000091BC" value="0xE0400000" />
+        <register type="NOA" address="0x000091C4" value="0xE4500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" /> <!--OAREPORTTRIG1 -->
+        <register type="OA" address="0x00002744" value="0x00800000" /> <!--OAREPORTTRIG2 -->
+        <register type="OA" address="0x00002710" value="0x00000000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002714" value="0x00800000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002720" value="0x00000000" /> <!--OASTARTTRIG1 -->
+        <register type="OA" address="0x00002724" value="0x00800000" /> <!--OASTARTTRIG6 -->
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-icl.xml b/lib/i915/perf-configs/oa-icl.xml
new file mode 100644
index 00000000..b78d4aa2
--- /dev/null
+++ b/lib/i915/perf-configs/oa-icl.xml
@@ -0,0 +1,11899 @@
+<?xml version="1.0"?>
+<metrics version="1562317149" merge_md5="">
+  <set name="Render Metrics Basic Gen11"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="193093b2-da24-49bf-b407-442c213b71b4"
+       chipset="ICL"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler00 Busy"
+             description="The percentage of time in which Slice0 Sampler0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_busy"
+             units="percent"
+             symbol_name="Sampler00Busy"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler00Busy"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             availability="$SubsliceMask 9 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Sampler00 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Slice0 Sampler0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler00_bottleneck"
+             units="percent"
+             symbol_name="Sampler00Bottleneck"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  B 1 READ B 3 READ UADD B 4 READ UADD B 5 READ UADD UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler00Bottleneck"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             availability="$SubsliceMask 9 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  B 0 READ B 2 READ UADD UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x142C0014" />
+        <register type="NOA" address="0x00009888" value="0x14120700" />
+        <register type="NOA" address="0x00009888" value="0x121500E0" />
+        <register type="NOA" address="0x00009888" value="0x1C1E000C" />
+        <register type="NOA" address="0x00009888" value="0x0E1F000C" />
+        <register type="NOA" address="0x00009888" value="0x1C200014" />
+        <register type="NOA" address="0x00009888" value="0x16212800" />
+        <register type="NOA" address="0x00009888" value="0x0E2C2041" />
+        <register type="NOA" address="0x00009888" value="0x102C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A2C0000" />
+        <register type="NOA" address="0x00009888" value="0x10040140" />
+        <register type="NOA" address="0x00009888" value="0x0E040005" />
+        <register type="NOA" address="0x00009888" value="0x14050050" />
+        <register type="NOA" address="0x00009888" value="0x06054000" />
+        <register type="NOA" address="0x00009888" value="0x08051000" />
+        <register type="NOA" address="0x00009888" value="0x260600C0" />
+        <register type="NOA" address="0x00009888" value="0x24061800" />
+        <register type="NOA" address="0x00009888" value="0x04120023" />
+        <register type="NOA" address="0x00009888" value="0x10120000" />
+        <register type="NOA" address="0x00009888" value="0x08120000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x04144000" />
+        <register type="NOA" address="0x00009888" value="0x02150980" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x1815000F" />
+        <register type="NOA" address="0x00009888" value="0x06150000" />
+        <register type="NOA" address="0x00009888" value="0x08154000" />
+        <register type="NOA" address="0x00009888" value="0x0E18A000" />
+        <register type="NOA" address="0x00009888" value="0x14190028" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1A1C01C0" />
+        <register type="NOA" address="0x00009888" value="0x1C1C000A" />
+        <register type="NOA" address="0x00009888" value="0x1A5C01C0" />
+        <register type="NOA" address="0x00009888" value="0x1C5C000A" />
+        <register type="NOA" address="0x00009888" value="0x001C0097" />
+        <register type="NOA" address="0x00009888" value="0x061C9400" />
+        <register type="NOA" address="0x00009888" value="0x0A1C00A7" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x081D8100" />
+        <register type="NOA" address="0x00009888" value="0x0A1D0004" />
+        <register type="NOA" address="0x00009888" value="0x085C9497" />
+        <register type="NOA" address="0x00009888" value="0x0A5CA700" />
+        <register type="NOA" address="0x00009888" value="0x105C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A5D000B" />
+        <register type="NOA" address="0x00009888" value="0x181E8000" />
+        <register type="NOA" address="0x00009888" value="0x1E1EEF80" />
+        <register type="NOA" address="0x00009888" value="0x301F4000" />
+        <register type="NOA" address="0x00009888" value="0x501F2404" />
+        <register type="NOA" address="0x00009888" value="0x521F0092" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2000" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0300" />
+        <register type="NOA" address="0x00009888" value="0x461F0303" />
+        <register type="NOA" address="0x00009888" value="0x481F0303" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0003" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x421F4001" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E65C" value="0xFFFFFFFF" />
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00051050" />
+        <register type="FLEX" address="0x0000E45C" value="0x00000052" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen11"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="233a477b-f8f0-40f4-bf57-01440c3701d9"
+       chipset="ICL"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 3 READ C 2 READ UADD $EuSubslicesTotalCount UMUL 32 UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ C 4 READ UADD $EuSubslicesTotalCount UMUL 32 UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ A 10 READ A 11 READ FADD A 9 READ FSUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Typed Atomics Accesses"
+             description="The total number of typed atomic accesses via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 4 READ B 5 READ FADD 2 FDIV $EuSubslicesTotalCount FMUL"
+             underscore_name="typed_atomics"
+             units="events"
+             symbol_name="TypedAtomics"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  B 1 READ B 3 READ UADD B 7 READ UADD B 6 READ UADD UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 0 READ UADD $EuSubslicesTotalCount UMUL 32 UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 7 READ C 6 READ UADD $EuSubslicesTotalCount UMUL 32 UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 13 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="64  B 0 READ B 2 READ UADD UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x12230012" />
+        <register type="NOA" address="0x00009888" value="0x10230019" />
+        <register type="NOA" address="0x00009888" value="0x12A30012" />
+        <register type="NOA" address="0x00009888" value="0x10A30019" />
+        <register type="NOA" address="0x00009888" value="0x1A200400" />
+        <register type="NOA" address="0x00009888" value="0x1C200020" />
+        <register type="NOA" address="0x00009888" value="0x04208000" />
+        <register type="NOA" address="0x00009888" value="0x08208000" />
+        <register type="NOA" address="0x00009888" value="0x0C208000" />
+        <register type="NOA" address="0x00009888" value="0x0A230031" />
+        <register type="NOA" address="0x00009888" value="0x0E231E00" />
+        <register type="NOA" address="0x00009888" value="0x0223003D" />
+        <register type="NOA" address="0x00009888" value="0x04230032" />
+        <register type="NOA" address="0x00009888" value="0x06230033" />
+        <register type="NOA" address="0x00009888" value="0x00230000" />
+        <register type="NOA" address="0x00009888" value="0x1AA01000" />
+        <register type="NOA" address="0x00009888" value="0x1CA00008" />
+        <register type="NOA" address="0x00009888" value="0x02A08000" />
+        <register type="NOA" address="0x00009888" value="0x06A08000" />
+        <register type="NOA" address="0x00009888" value="0x0AA08000" />
+        <register type="NOA" address="0x00009888" value="0x0AA31880" />
+        <register type="NOA" address="0x00009888" value="0x0EA3003C" />
+        <register type="NOA" address="0x00009888" value="0x00A31E80" />
+        <register type="NOA" address="0x00009888" value="0x02A31900" />
+        <register type="NOA" address="0x00009888" value="0x04A31980" />
+        <register type="NOA" address="0x00009888" value="0x0E044055" />
+        <register type="NOA" address="0x00009888" value="0x10040141" />
+        <register type="NOA" address="0x00009888" value="0x0C045000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050050" />
+        <register type="NOA" address="0x00009888" value="0x04054000" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x0A051000" />
+        <register type="NOA" address="0x00009888" value="0x260600CC" />
+        <register type="NOA" address="0x00009888" value="0x24067E00" />
+        <register type="NOA" address="0x00009888" value="0x18123000" />
+        <register type="NOA" address="0x00009888" value="0x1A12000C" />
+        <register type="NOA" address="0x00009888" value="0x0212C000" />
+        <register type="NOA" address="0x00009888" value="0x0612C000" />
+        <register type="NOA" address="0x00009888" value="0x0A12C000" />
+        <register type="NOA" address="0x00009888" value="0x08138000" />
+        <register type="NOA" address="0x00009888" value="0x0A134000" />
+        <register type="NOA" address="0x00009888" value="0x0413A000" />
+        <register type="NOA" address="0x00009888" value="0x06132000" />
+        <register type="NOA" address="0x00009888" value="0x0A148000" />
+        <register type="NOA" address="0x00009888" value="0x0E144000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x02148000" />
+        <register type="NOA" address="0x00009888" value="0x04148000" />
+        <register type="NOA" address="0x00009888" value="0x16150380" />
+        <register type="NOA" address="0x00009888" value="0x1815000D" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x0415C000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x0815C000" />
+        <register type="NOA" address="0x00009888" value="0x0A154000" />
+        <register type="NOA" address="0x00009888" value="0x0C15C000" />
+        <register type="NOA" address="0x00009888" value="0x0A182000" />
+        <register type="NOA" address="0x00009888" value="0x0E188000" />
+        <register type="NOA" address="0x00009888" value="0x02182000" />
+        <register type="NOA" address="0x00009888" value="0x04182000" />
+        <register type="NOA" address="0x00009888" value="0x06182000" />
+        <register type="NOA" address="0x00009888" value="0x12190400" />
+        <register type="NOA" address="0x00009888" value="0x14190020" />
+        <register type="NOA" address="0x00009888" value="0x0A192000" />
+        <register type="NOA" address="0x00009888" value="0x0C192000" />
+        <register type="NOA" address="0x00009888" value="0x0E192000" />
+        <register type="NOA" address="0x00009888" value="0x0A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E1C2000" />
+        <register type="NOA" address="0x00009888" value="0x001C8000" />
+        <register type="NOA" address="0x00009888" value="0x021C8000" />
+        <register type="NOA" address="0x00009888" value="0x041C8000" />
+        <register type="NOA" address="0x00009888" value="0x121D1000" />
+        <register type="NOA" address="0x00009888" value="0x141D0008" />
+        <register type="NOA" address="0x00009888" value="0x081D8000" />
+        <register type="NOA" address="0x00009888" value="0x0A1D8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1D8000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1A1C01C0" />
+        <register type="NOA" address="0x00009888" value="0x1C1C000A" />
+        <register type="NOA" address="0x00009888" value="0x1A5C01C0" />
+        <register type="NOA" address="0x00009888" value="0x1C5C000A" />
+        <register type="NOA" address="0x00009888" value="0x001C0097" />
+        <register type="NOA" address="0x00009888" value="0x061C9400" />
+        <register type="NOA" address="0x00009888" value="0x0C1CA700" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x081D8100" />
+        <register type="NOA" address="0x00009888" value="0x0A1D0020" />
+        <register type="NOA" address="0x00009888" value="0x085C9497" />
+        <register type="NOA" address="0x00009888" value="0x0C5C00A7" />
+        <register type="NOA" address="0x00009888" value="0x105C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A5D0013" />
+        <register type="NOA" address="0x00009888" value="0x181E8000" />
+        <register type="NOA" address="0x00009888" value="0x1E1E0F80" />
+        <register type="NOA" address="0x00009888" value="0x201E000B" />
+        <register type="NOA" address="0x00009888" value="0x301F4000" />
+        <register type="NOA" address="0x00009888" value="0x501F2524" />
+        <register type="NOA" address="0x00009888" value="0x521F2522" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2430" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0300" />
+        <register type="NOA" address="0x00009888" value="0x461F0303" />
+        <register type="NOA" address="0x00009888" value="0x481F3003" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0300" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0003" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F3000" />
+        <register type="NOA" address="0x00009888" value="0x421F3000" />
+        <register type="NOA" address="0x00009888" value="0x441F3000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="ComputeExtended Gen11"
+       mdapi_supported_apis="OGL OGL4 OCL MEDIA IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="43eb7fc1-dc5e-45e2-a90a-0053f5397271"
+       chipset="ICL"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="B 7 READ B 1 READ FADD C 2 READ FADD C 3 READ FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu Typed Atomics 00"
+             description="Slice0 Dualsubslice 0 Eu Typed Atomics"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_atomics00"
+             units="messages"
+             symbol_name="EuTypedAtomics00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 00"
+             description="Slice 0 Dualsubslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="typed_atomics00"
+             units="messages"
+             symbol_name="TypedAtomics00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics00 $TypedAtomics00 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu 64 Untyped Reads 00"
+             description="Slice0 Dualsubslice 0 Eu 64 Untyped Reads"
+             data_type="float"
+             equation="B 5 READ C 1 READ FADD B 6 READ FADD"
+             underscore_name="eu_a64_untyped_reads00"
+             units="messages"
+             symbol_name="EuA64UntypedReads00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu A32 Untyped Writes 00"
+             description="Slice0 Dualsubslice 0 Eu A32 Untyped Writes"
+             data_type="uint64"
+             equation="B 7 READ B 1 READ UADD"
+             underscore_name="eu_a32_untyped_writes00"
+             units="messages"
+             symbol_name="EuA32UntypedWrites00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Eu Typed Reads 00"
+             description="Slice0 Dualsubslice 0 Eu Typed Reads"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_reads00"
+             units="messages"
+             symbol_name="EuTypedReads00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu Typed Writes 00"
+             description="Slice0 Dualsubslice 0 Eu Typed Writes"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_typed_writes00"
+             units="messages"
+             symbol_name="EuTypedWrites00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Writes 00"
+             description="Slice 0 Dualsubslice 0 typed writes."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="typed_writes00"
+             units="messages"
+             symbol_name="TypedWrites00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites00 $TypedWrites00 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes 00"
+             description="Slice 0 Dualsubslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_writes00"
+             units="messages"
+             symbol_name="UntypedWrites00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 00"
+             description="Slice 0 Dualsubslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="untyped_reads00"
+             units="messages"
+             symbol_name="UntypedReads00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu A64 Untyped Writes 00"
+             description="Slice0 Dualsubslice 0 Eu A64 Untyped Writes"
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="eu_a64_untyped_writes00"
+             units="messages"
+             symbol_name="EuA64UntypedWrites00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="B 0 READ B 5 READ C 1 READ FADD B 6 READ FADD FADD C 4 READ FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 00"
+             description="Slice 0 Dualsubslice 0 typed reads."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="typed_reads00"
+             units="messages"
+             symbol_name="TypedReads00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads00 $TypedReads00 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Eu A32 Untyped Reads 00"
+             description="Slice0 Dualsubslice 0 Eu A32 Untyped Reads"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_a32_untyped_reads00"
+             units="messages"
+             symbol_name="EuA32UntypedReads00"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x1222000B" />
+        <register type="NOA" address="0x00009888" value="0x16220009" />
+        <register type="NOA" address="0x00009888" value="0x12230019" />
+        <register type="NOA" address="0x00009888" value="0x10230012" />
+        <register type="NOA" address="0x00009888" value="0x101E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1EF800" />
+        <register type="NOA" address="0x00009888" value="0x1C1E0007" />
+        <register type="NOA" address="0x00009888" value="0x001F8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1FF800" />
+        <register type="NOA" address="0x00009888" value="0x0E1F0007" />
+        <register type="NOA" address="0x00009888" value="0x00204000" />
+        <register type="NOA" address="0x00009888" value="0x0E204000" />
+        <register type="NOA" address="0x00009888" value="0x1A202AA0" />
+        <register type="NOA" address="0x00009888" value="0x1C200005" />
+        <register type="NOA" address="0x00009888" value="0x04208000" />
+        <register type="NOA" address="0x00009888" value="0x06208000" />
+        <register type="NOA" address="0x00009888" value="0x08208000" />
+        <register type="NOA" address="0x00009888" value="0x0A208000" />
+        <register type="NOA" address="0x00009888" value="0x0C208000" />
+        <register type="NOA" address="0x00009888" value="0x00214000" />
+        <register type="NOA" address="0x00009888" value="0x0E214000" />
+        <register type="NOA" address="0x00009888" value="0x14214000" />
+        <register type="NOA" address="0x00009888" value="0x16210555" />
+        <register type="NOA" address="0x00009888" value="0x00220011" />
+        <register type="NOA" address="0x00009888" value="0x06220900" />
+        <register type="NOA" address="0x00009888" value="0x08220A13" />
+        <register type="NOA" address="0x00009888" value="0x0A220B15" />
+        <register type="NOA" address="0x00009888" value="0x0C222317" />
+        <register type="NOA" address="0x00009888" value="0x0E220043" />
+        <register type="NOA" address="0x00009888" value="0x02231AB4" />
+        <register type="NOA" address="0x00009888" value="0x04231DBA" />
+        <register type="NOA" address="0x00009888" value="0x06230039" />
+        <register type="NOA" address="0x00009888" value="0x00230000" />
+        <register type="NOA" address="0x00009888" value="0x0C044400" />
+        <register type="NOA" address="0x00009888" value="0x0E045555" />
+        <register type="NOA" address="0x00009888" value="0x10040055" />
+        <register type="NOA" address="0x00009888" value="0x04051000" />
+        <register type="NOA" address="0x00009888" value="0x0A055000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050015" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x2406FD00" />
+        <register type="NOA" address="0x00009888" value="0x2606007F" />
+        <register type="NOA" address="0x00009888" value="0x0015C000" />
+        <register type="NOA" address="0x00009888" value="0x0E15C000" />
+        <register type="NOA" address="0x00009888" value="0x16157FF8" />
+        <register type="NOA" address="0x00009888" value="0x18150003" />
+        <register type="NOA" address="0x00009888" value="0x0415C000" />
+        <register type="NOA" address="0x00009888" value="0x0615C000" />
+        <register type="NOA" address="0x00009888" value="0x0815C000" />
+        <register type="NOA" address="0x00009888" value="0x0A15C000" />
+        <register type="NOA" address="0x00009888" value="0x0C15C000" />
+        <register type="NOA" address="0x00009888" value="0x00182000" />
+        <register type="NOA" address="0x00009888" value="0x0618A000" />
+        <register type="NOA" address="0x00009888" value="0x0818A000" />
+        <register type="NOA" address="0x00009888" value="0x0A18A000" />
+        <register type="NOA" address="0x00009888" value="0x0C18A000" />
+        <register type="NOA" address="0x00009888" value="0x0E182000" />
+        <register type="NOA" address="0x00009888" value="0x0218A000" />
+        <register type="NOA" address="0x00009888" value="0x0418A000" />
+        <register type="NOA" address="0x00009888" value="0x08192000" />
+        <register type="NOA" address="0x00009888" value="0x0E19A000" />
+        <register type="NOA" address="0x00009888" value="0x12195540" />
+        <register type="NOA" address="0x00009888" value="0x1419000A" />
+        <register type="NOA" address="0x00009888" value="0x0A19A000" />
+        <register type="NOA" address="0x00009888" value="0x0C19A000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x16136860" />
+        <register type="NOA" address="0x00009888" value="0x24000004" />
+        <register type="NOA" address="0x00009888" value="0x20000040" />
+        <register type="NOA" address="0x00009888" value="0x0E132980" />
+        <register type="NOA" address="0x00009888" value="0x00132D80" />
+        <register type="NOA" address="0x00009888" value="0x10130000" />
+        <register type="NOA" address="0x00009888" value="0x1A130000" />
+        <register type="NOA" address="0x00009888" value="0x02130000" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4924" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F000C" />
+        <register type="NOA" address="0x00009888" value="0x3A1F2000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2413" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x461F0000" />
+        <register type="NOA" address="0x00009888" value="0x481F0000" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F3013" />
+        <register type="NOA" address="0x00009888" value="0x421F3030" />
+        <register type="NOA" address="0x00009888" value="0x441F3030" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x30000036" />
+        <register type="OA" address="0x00002774" value="0x01FFFE00" />
+        <register type="OA" address="0x00002778" value="0x31000034" />
+        <register type="OA" address="0x0000277C" value="0x01FFFE00" />
+        <register type="OA" address="0x00002780" value="0x00000C9A" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x00000C92" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x00000CA2" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x00000E42" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x00000E6A" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x00000C32" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+        <register type="OA" address="0x0000274C" value="0x87643210" />
+        <register type="OA" address="0x00002744" value="0x00001811" />
+        <register type="OA" address="0x00002748" value="0x87654310" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen11"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="022b8913-ae9f-4559-abcd-583e586170d0"
+       chipset="ICL"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank3."
+             data_type="uint64"
+             equation="C 4 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank0 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank0."
+             data_type="uint64"
+             equation="C 7 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank1 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank1."
+             data_type="uint64"
+             equation="C 6 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank2 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank2."
+             data_type="uint64"
+             equation="C 5 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank4 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank4."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="l3_bank04_accesses"
+             units="messages"
+             symbol_name="L3Bank04Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank5 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank5."
+             data_type="uint64"
+             equation="C 2 READ 2 UMUL"
+             underscore_name="l3_bank05_accesses"
+             units="messages"
+             symbol_name="L3Bank05Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank6 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank6."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank06_accesses"
+             units="messages"
+             symbol_name="L3Bank06Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="Slice0 L3 Bank7 Accesses"
+             description="The total number of accesses to Slice0 L3 Bank7."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank07_accesses"
+             units="messages"
+             symbol_name="L3Bank07Accesses"
+             availability="$SliceMask 1 AND"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="$L3Bank00Accesses $L3Bank01Accesses UADD $L3Bank02Accesses UADD $L3Bank03Accesses UADD $L3Bank04Accesses UADD $L3Bank05Accesses UADD $L3Bank06Accesses UADD $L3Bank07Accesses UADD"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="64  B 7 READ B 6 READ UADD 8 UMUL UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ A 10 READ A 11 READ FADD A 9 READ FSUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="2 B 5 READ B 4 READ UADD UMUL"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages send to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="$SamplerAccesses 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="B 7 READ B 6 READ UADD 8 UMUL A 32 READ UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 2 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 3 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x14120700" />
+        <register type="NOA" address="0x00009888" value="0x121500E0" />
+        <register type="NOA" address="0x00009888" value="0x10040154" />
+        <register type="NOA" address="0x00009888" value="0x0C045000" />
+        <register type="NOA" address="0x00009888" value="0x0E040055" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x04054000" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x0A051000" />
+        <register type="NOA" address="0x00009888" value="0x260600F0" />
+        <register type="NOA" address="0x00009888" value="0x24067E00" />
+        <register type="NOA" address="0x00009888" value="0x0C120023" />
+        <register type="NOA" address="0x00009888" value="0x0E12152B" />
+        <register type="NOA" address="0x00009888" value="0x00121480" />
+        <register type="NOA" address="0x00009888" value="0x02120028" />
+        <register type="NOA" address="0x00009888" value="0x10120000" />
+        <register type="NOA" address="0x00009888" value="0x18120000" />
+        <register type="NOA" address="0x00009888" value="0x1A120000" />
+        <register type="NOA" address="0x00009888" value="0x04120000" />
+        <register type="NOA" address="0x00009888" value="0x0A13D000" />
+        <register type="NOA" address="0x00009888" value="0x04136000" />
+        <register type="NOA" address="0x00009888" value="0x0C144000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x02144000" />
+        <register type="NOA" address="0x00009888" value="0x0C150980" />
+        <register type="NOA" address="0x00009888" value="0x02154D80" />
+        <register type="NOA" address="0x00009888" value="0x04154C9A" />
+        <register type="NOA" address="0x00009888" value="0x06150018" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x16150800" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009888" value="0x08150000" />
+        <register type="NOA" address="0x00009888" value="0x0A150000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x0A1473A0" />
+        <register type="NOA" address="0x00009888" value="0x1217241C" />
+        <register type="NOA" address="0x00009888" value="0x22000550" />
+        <register type="NOA" address="0x00009888" value="0x18137C00" />
+        <register type="NOA" address="0x00009888" value="0x1A130001" />
+        <register type="NOA" address="0x00009888" value="0x061434A0" />
+        <register type="NOA" address="0x00009888" value="0x00140000" />
+        <register type="NOA" address="0x00009888" value="0x081710B0" />
+        <register type="NOA" address="0x00009888" value="0x10170000" />
+        <register type="NOA" address="0x00009888" value="0x501F1124" />
+        <register type="NOA" address="0x00009888" value="0x521F4849" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2400" />
+        <register type="NOA" address="0x00009888" value="0x461F3100" />
+        <register type="NOA" address="0x00009888" value="0x481F3131" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0031" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0030" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F0000" />
+        <register type="NOA" address="0x00009888" value="0x421F3030" />
+        <register type="NOA" address="0x00009888" value="0x441F3030" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen11"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="03c7a167-2abc-4ba6-878a-f1d80082abca"
+       chipset="ICL"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull stall pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x001F001E" />
+        <register type="NOA" address="0x00009888" value="0x10160000" />
+        <register type="NOA" address="0x00009888" value="0x1017001F" />
+        <register type="NOA" address="0x00009888" value="0x0A1F0005" />
+        <register type="NOA" address="0x00009888" value="0x0E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x0C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x1A200800" />
+        <register type="NOA" address="0x00009888" value="0x10040015" />
+        <register type="NOA" address="0x00009888" value="0x0E054000" />
+        <register type="NOA" address="0x00009888" value="0x14050005" />
+        <register type="NOA" address="0x00009888" value="0x26060038" />
+        <register type="NOA" address="0x00009888" value="0x16157E00" />
+        <register type="NOA" address="0x00009888" value="0x0C160022" />
+        <register type="NOA" address="0x00009888" value="0x08160000" />
+        <register type="NOA" address="0x00009888" value="0x0C170540" />
+        <register type="NOA" address="0x00009888" value="0x04170000" />
+        <register type="NOA" address="0x00009888" value="0x0A188000" />
+        <register type="NOA" address="0x00009888" value="0x0C181000" />
+        <register type="NOA" address="0x00009888" value="0x12195000" />
+        <register type="NOA" address="0x00009888" value="0x14190001" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x12010000" />
+        <register type="NOA" address="0x00009888" value="0x100B7C00" />
+        <register type="NOA" address="0x00009888" value="0x100F0019" />
+        <register type="NOA" address="0x00009888" value="0x10107C00" />
+        <register type="NOA" address="0x00009888" value="0x16100000" />
+        <register type="NOA" address="0x00009888" value="0x00110000" />
+        <register type="NOA" address="0x00009888" value="0x120703C0" />
+        <register type="NOA" address="0x00009888" value="0x10090000" />
+        <register type="NOA" address="0x00009888" value="0x06010080" />
+        <register type="NOA" address="0x00009888" value="0x0E014180" />
+        <register type="NOA" address="0x00009888" value="0x10010000" />
+        <register type="NOA" address="0x00009888" value="0x00014000" />
+        <register type="NOA" address="0x00009888" value="0x060B0015" />
+        <register type="NOA" address="0x00009888" value="0x080B8000" />
+        <register type="NOA" address="0x00009888" value="0x0A0B2000" />
+        <register type="NOA" address="0x00009888" value="0x020BA000" />
+        <register type="NOA" address="0x00009888" value="0x040BA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0E0A02" />
+        <register type="NOA" address="0x00009888" value="0x0C0EA800" />
+        <register type="NOA" address="0x00009888" value="0x020F0002" />
+        <register type="NOA" address="0x00009888" value="0x180F0800" />
+        <register type="NOA" address="0x00009888" value="0x040F0000" />
+        <register type="NOA" address="0x00009888" value="0x060F8000" />
+        <register type="NOA" address="0x00009888" value="0x0A100017" />
+        <register type="NOA" address="0x00009888" value="0x04107113" />
+        <register type="NOA" address="0x00009888" value="0x18100020" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x08100000" />
+        <register type="NOA" address="0x00009888" value="0x08110C40" />
+        <register type="NOA" address="0x00009888" value="0x02110C80" />
+        <register type="NOA" address="0x00009888" value="0x00024000" />
+        <register type="NOA" address="0x00009888" value="0x06028000" />
+        <register type="NOA" address="0x00009888" value="0x0E02C000" />
+        <register type="NOA" address="0x00009888" value="0x00039000" />
+        <register type="NOA" address="0x00009888" value="0x06036000" />
+        <register type="NOA" address="0x00009888" value="0x0803A000" />
+        <register type="NOA" address="0x00009888" value="0x0A032000" />
+        <register type="NOA" address="0x00009888" value="0x0E035000" />
+        <register type="NOA" address="0x00009888" value="0x0203A000" />
+        <register type="NOA" address="0x00009888" value="0x0403A000" />
+        <register type="NOA" address="0x00009888" value="0x00044000" />
+        <register type="NOA" address="0x00009888" value="0x0E044000" />
+        <register type="NOA" address="0x00009888" value="0x10068000" />
+        <register type="NOA" address="0x00009888" value="0x12068000" />
+        <register type="NOA" address="0x00009888" value="0x14068000" />
+        <register type="NOA" address="0x00009888" value="0x02068000" />
+        <register type="NOA" address="0x00009888" value="0x04068000" />
+        <register type="NOA" address="0x00009888" value="0x06068000" />
+        <register type="NOA" address="0x00009888" value="0x08068000" />
+        <register type="NOA" address="0x00009888" value="0x0A068000" />
+        <register type="NOA" address="0x00009888" value="0x0C068000" />
+        <register type="NOA" address="0x00009888" value="0x00070032" />
+        <register type="NOA" address="0x00009888" value="0x0E070033" />
+        <register type="NOA" address="0x00009888" value="0x04070000" />
+        <register type="NOA" address="0x00009888" value="0x08098011" />
+        <register type="NOA" address="0x00009888" value="0x00090980" />
+        <register type="NOA" address="0x00009888" value="0x18090A00" />
+        <register type="NOA" address="0x00009888" value="0x02090000" />
+        <register type="NOA" address="0x00009888" value="0x04098000" />
+        <register type="NOA" address="0x00009888" value="0x06098000" />
+        <register type="NOA" address="0x00009888" value="0x0A098000" />
+        <register type="NOA" address="0x00009888" value="0x0C098000" />
+        <register type="NOA" address="0x00009888" value="0x301F6000" />
+        <register type="NOA" address="0x00009888" value="0x501F36DB" />
+        <register type="NOA" address="0x00009888" value="0x521F491B" />
+        <register type="NOA" address="0x00009888" value="0x541F001B" />
+        <register type="NOA" address="0x00009888" value="0x3A1F6000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F1B41" />
+        <register type="NOA" address="0x00009888" value="0x3E1F2100" />
+        <register type="NOA" address="0x00009888" value="0x461F4141" />
+        <register type="NOA" address="0x00009888" value="0x481F1160" />
+        <register type="NOA" address="0x00009888" value="0x4A1F1000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F2120" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F0141" />
+        <register type="NOA" address="0x00009888" value="0x421F1160" />
+        <register type="NOA" address="0x00009888" value="0x441F3111" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="c5cbc488-6569-41dd-9128-42bf6f0d317c"
+       chipset="ICL"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="Slice0 Dualsubslice1 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ C 1 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Dualsubslice2 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ C 3 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 Dualsubslice0 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ B 7 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Dualsubslice3 Non-sampler Shader Access Stalled On L3"
+             description="Percentage of time when HDC has messages to L3, but it's stalled due to lack of credits (Slice0 Dualsubslice3)"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ C 5 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader03_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader03AccessStalledOnL3"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x1223000A" />
+        <register type="NOA" address="0x00009888" value="0x10230009" />
+        <register type="NOA" address="0x00009888" value="0x1263000A" />
+        <register type="NOA" address="0x00009888" value="0x10630009" />
+        <register type="NOA" address="0x00009888" value="0x12A3000A" />
+        <register type="NOA" address="0x00009888" value="0x10A30009" />
+        <register type="NOA" address="0x00009888" value="0x12E3000A" />
+        <register type="NOA" address="0x00009888" value="0x10E30009" />
+        <register type="NOA" address="0x00009888" value="0x10150019" />
+        <register type="NOA" address="0x00009888" value="0x1C20000A" />
+        <register type="NOA" address="0x00009888" value="0x0C231900" />
+        <register type="NOA" address="0x00009888" value="0x0E23003C" />
+        <register type="NOA" address="0x00009888" value="0x00230000" />
+        <register type="NOA" address="0x00009888" value="0x1C600020" />
+        <register type="NOA" address="0x00009888" value="0x02608000" />
+        <register type="NOA" address="0x00009888" value="0x0E631900" />
+        <register type="NOA" address="0x00009888" value="0x00631E00" />
+        <register type="NOA" address="0x00009888" value="0x04A08000" />
+        <register type="NOA" address="0x00009888" value="0x06A08000" />
+        <register type="NOA" address="0x00009888" value="0x02A31E32" />
+        <register type="NOA" address="0x00009888" value="0x00A30000" />
+        <register type="NOA" address="0x00009888" value="0x08E08000" />
+        <register type="NOA" address="0x00009888" value="0x0AE08000" />
+        <register type="NOA" address="0x00009888" value="0x04E31E32" />
+        <register type="NOA" address="0x00009888" value="0x00E30000" />
+        <register type="NOA" address="0x00009888" value="0x0C045400" />
+        <register type="NOA" address="0x00009888" value="0x10040150" />
+        <register type="NOA" address="0x00009888" value="0x0E040015" />
+        <register type="NOA" address="0x00009888" value="0x04055000" />
+        <register type="NOA" address="0x00009888" value="0x14050054" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x24063F00" />
+        <register type="NOA" address="0x00009888" value="0x260600E0" />
+        <register type="NOA" address="0x00009888" value="0x0E088000" />
+        <register type="NOA" address="0x00009888" value="0x00088000" />
+        <register type="NOA" address="0x00009888" value="0x14090040" />
+        <register type="NOA" address="0x00009888" value="0x04094000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x080E5000" />
+        <register type="NOA" address="0x00009888" value="0x1A120020" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x0412C000" />
+        <register type="NOA" address="0x00009888" value="0x0612C000" />
+        <register type="NOA" address="0x00009888" value="0x0A138000" />
+        <register type="NOA" address="0x00009888" value="0x0413E000" />
+        <register type="NOA" address="0x00009888" value="0x0E148000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x0214C000" />
+        <register type="NOA" address="0x00009888" value="0x00150047" />
+        <register type="NOA" address="0x00009888" value="0x16156000" />
+        <register type="NOA" address="0x00009888" value="0x18150007" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x08158000" />
+        <register type="NOA" address="0x00009888" value="0x0A158000" />
+        <register type="NOA" address="0x00009888" value="0x0C188000" />
+        <register type="NOA" address="0x00009888" value="0x0E182000" />
+        <register type="NOA" address="0x00009888" value="0x1419000A" />
+        <register type="NOA" address="0x00009888" value="0x021CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A1DA000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1C1F3061" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x521F4000" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2400" />
+        <register type="NOA" address="0x00009888" value="0x501F0024" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0100" />
+        <register type="NOA" address="0x00009888" value="0x4C1F3030" />
+        <register type="NOA" address="0x00009888" value="0x401F0000" />
+        <register type="NOA" address="0x00009888" value="0x421F3000" />
+        <register type="NOA" address="0x00009888" value="0x441F3330" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FFFE" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="0316ce4f-e03f-4738-8262-13528fce8eea"
+       chipset="ICL"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Pipe0 PS Output Available"
+             description="The percentage of time in which slice0 pipe0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output00_available"
+             units="percent"
+             symbol_name="PSOutput00Available"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Slice0 Pipe1 PS Output Available"
+             description="The percentage of time in which slice0 pipe1 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output01_available"
+             units="percent"
+             symbol_name="PSOutput01Available"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pipe1 Pixel Values Ready"
+             description="The percentage of time in which slice0 pipe1 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values01_ready"
+             units="percent"
+             symbol_name="PixelValues01Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Pipe0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0  pipe0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data00_ready"
+             units="percent"
+             symbol_name="PixelData00Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="Slice0 Pipe1 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0  pipe1 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data01_ready"
+             units="percent"
+             symbol_name="PixelData01Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice0 Pipe0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pipe0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values00_ready"
+             units="percent"
+             symbol_name="PixelValues00Ready"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x140A001F" />
+        <register type="NOA" address="0x00009888" value="0x040C5000" />
+        <register type="NOA" address="0x00009888" value="0x140F001F" />
+        <register type="NOA" address="0x00009888" value="0x04115017" />
+        <register type="NOA" address="0x00009888" value="0x10136000" />
+        <register type="NOA" address="0x00009888" value="0x1213001C" />
+        <register type="NOA" address="0x00009888" value="0x16140000" />
+        <register type="NOA" address="0x00009888" value="0x10160018" />
+        <register type="NOA" address="0x00009888" value="0x101A0018" />
+        <register type="NOA" address="0x00009888" value="0x0C045400" />
+        <register type="NOA" address="0x00009888" value="0x0E045545" />
+        <register type="NOA" address="0x00009888" value="0x04055000" />
+        <register type="NOA" address="0x00009888" value="0x0A055000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E051000" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08051000" />
+        <register type="NOA" address="0x00009888" value="0x2406DF00" />
+        <register type="NOA" address="0x00009888" value="0x26060007" />
+        <register type="NOA" address="0x00009888" value="0x00084000" />
+        <register type="NOA" address="0x00009888" value="0x02084000" />
+        <register type="NOA" address="0x00009888" value="0x04094000" />
+        <register type="NOA" address="0x00009888" value="0x06094000" />
+        <register type="NOA" address="0x00009888" value="0x000A3080" />
+        <register type="NOA" address="0x00009888" value="0x160A0000" />
+        <register type="NOA" address="0x00009888" value="0x080A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A0A8000" />
+        <register type="NOA" address="0x00009888" value="0x020C05C0" />
+        <register type="NOA" address="0x00009888" value="0x080C0000" />
+        <register type="NOA" address="0x00009888" value="0x020D1000" />
+        <register type="NOA" address="0x00009888" value="0x040D1000" />
+        <register type="NOA" address="0x00009888" value="0x060E1000" />
+        <register type="NOA" address="0x00009888" value="0x080E1000" />
+        <register type="NOA" address="0x00009888" value="0x020F0061" />
+        <register type="NOA" address="0x00009888" value="0x160F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x08110000" />
+        <register type="NOA" address="0x00009888" value="0x18120C00" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x06128000" />
+        <register type="NOA" address="0x00009888" value="0x0613092F" />
+        <register type="NOA" address="0x00009888" value="0x08134025" />
+        <register type="NOA" address="0x00009888" value="0x0C130000" />
+        <register type="NOA" address="0x00009888" value="0x0413A000" />
+        <register type="NOA" address="0x00009888" value="0x00148066" />
+        <register type="NOA" address="0x00009888" value="0x10140000" />
+        <register type="NOA" address="0x00009888" value="0x0614C000" />
+        <register type="NOA" address="0x00009888" value="0x08144000" />
+        <register type="NOA" address="0x00009888" value="0x0A144000" />
+        <register type="NOA" address="0x00009888" value="0x02148000" />
+        <register type="NOA" address="0x00009888" value="0x00154000" />
+        <register type="NOA" address="0x00009888" value="0x0E154000" />
+        <register type="NOA" address="0x00009888" value="0x161500E8" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04158000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x08158000" />
+        <register type="NOA" address="0x00009888" value="0x0C154000" />
+        <register type="NOA" address="0x00009888" value="0x08161000" />
+        <register type="NOA" address="0x00009888" value="0x08184000" />
+        <register type="NOA" address="0x00009888" value="0x12190100" />
+        <register type="NOA" address="0x00009888" value="0x0A1A0020" />
+        <register type="NOA" address="0x00009888" value="0x081A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A1C1000" />
+        <register type="NOA" address="0x00009888" value="0x121D0400" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1C1F3000" />
+        <register type="NOA" address="0x00009888" value="0x1A1F0061" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4904" />
+        <register type="NOA" address="0x00009888" value="0x521F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2400" />
+        <register type="NOA" address="0x00009888" value="0x3E1F6000" />
+        <register type="NOA" address="0x00009888" value="0x461F5050" />
+        <register type="NOA" address="0x00009888" value="0x481F1040" />
+        <register type="NOA" address="0x00009888" value="0x401F4010" />
+        <register type="NOA" address="0x00009888" value="0x421F3000" />
+        <register type="NOA" address="0x00009888" value="0x441F5033" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000038" />
+        <register type="OA" address="0x00002774" value="0x0000FFF8" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFEF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="21d69ec3-91e1-48a8-acd6-c0c4ec6e819a"
+       chipset="ICL"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Slice0 L3 Bank5 Active"
+             description="The percentage of time in which slice0 L3 bank5 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank5_active"
+             units="percent"
+             symbol_name="L30Bank5Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank6 Active"
+             description="The percentage of time in which slice0 L3 bank6 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank6_active"
+             units="percent"
+             symbol_name="L30Bank6Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 L3 Bank7 Active"
+             description="The percentage of time in which slice0 L3 bank7 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank7_active"
+             units="percent"
+             symbol_name="L30Bank7Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 L3 Bank4 Active"
+             description="The percentage of time in which slice0 L3 bank4 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank4_active"
+             units="percent"
+             symbol_name="L30Bank4Active"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x17340000" />
+        <register type="NOA" address="0x00009888" value="0x17740000" />
+        <register type="NOA" address="0x00009888" value="0x17B40000" />
+        <register type="NOA" address="0x00009888" value="0x17F40000" />
+        <register type="NOA" address="0x00009888" value="0x16340000" />
+        <register type="NOA" address="0x00009888" value="0x16740000" />
+        <register type="NOA" address="0x00009888" value="0x16B40000" />
+        <register type="NOA" address="0x00009888" value="0x16F40000" />
+        <register type="NOA" address="0x00009888" value="0x07340037" />
+        <register type="NOA" address="0x00009888" value="0x21340000" />
+        <register type="NOA" address="0x00009888" value="0x09740037" />
+        <register type="NOA" address="0x00009888" value="0x21740000" />
+        <register type="NOA" address="0x00009888" value="0x0BB40037" />
+        <register type="NOA" address="0x00009888" value="0x21B40000" />
+        <register type="NOA" address="0x00009888" value="0x0DF40037" />
+        <register type="NOA" address="0x00009888" value="0x21F40000" />
+        <register type="NOA" address="0x00009888" value="0x0E0000A7" />
+        <register type="NOA" address="0x00009888" value="0x08012000" />
+        <register type="NOA" address="0x00009888" value="0x0A034000" />
+        <register type="NOA" address="0x00009888" value="0x0C038000" />
+        <register type="NOA" address="0x00009888" value="0x1C340037" />
+        <register type="NOA" address="0x00009888" value="0x20340000" />
+        <register type="NOA" address="0x00009888" value="0x1E740037" />
+        <register type="NOA" address="0x00009888" value="0x20740000" />
+        <register type="NOA" address="0x00009888" value="0x02B40037" />
+        <register type="NOA" address="0x00009888" value="0x20B40000" />
+        <register type="NOA" address="0x00009888" value="0x04F40037" />
+        <register type="NOA" address="0x00009888" value="0x20F40000" />
+        <register type="NOA" address="0x00009888" value="0x10040200" />
+        <register type="NOA" address="0x00009888" value="0x0E040055" />
+        <register type="NOA" address="0x00009888" value="0x14050070" />
+        <register type="NOA" address="0x00009888" value="0x04058000" />
+        <register type="NOA" address="0x00009888" value="0x06056000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x0A051000" />
+        <register type="NOA" address="0x00009888" value="0x260600C0" />
+        <register type="NOA" address="0x00009888" value="0x24067E00" />
+        <register type="NOA" address="0x00009888" value="0x02074000" />
+        <register type="NOA" address="0x00009888" value="0x04078000" />
+        <register type="NOA" address="0x00009888" value="0x06124000" />
+        <register type="NOA" address="0x00009888" value="0x08124000" />
+        <register type="NOA" address="0x00009888" value="0x0A124000" />
+        <register type="NOA" address="0x00009888" value="0x0C124000" />
+        <register type="NOA" address="0x00009888" value="0x04138000" />
+        <register type="NOA" address="0x00009888" value="0x06137000" />
+        <register type="NOA" address="0x00009888" value="0x02148000" />
+        <register type="NOA" address="0x00009888" value="0x0414C000" />
+        <register type="NOA" address="0x00009888" value="0x06144000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x08154000" />
+        <register type="NOA" address="0x00009888" value="0x0A154000" />
+        <register type="NOA" address="0x00009888" value="0x0C154000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1C1F3000" />
+        <register type="NOA" address="0x00009888" value="0x2A1F0061" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x521F0000" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2460" />
+        <register type="NOA" address="0x00009888" value="0x501F0124" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0133" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F6060" />
+        <register type="NOA" address="0x00009888" value="0x421F0010" />
+        <register type="NOA" address="0x00009888" value="0x441F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Gen11 L2Bank0 stalled metric set"
+       mdapi_supported_apis="OGL OGL4 OCL MEDIA IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="e60e9155-6830-4aec-baf2-1c3c15a73869"
+       chipset="ICL"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD B 2 READ FADD B 3 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x10050C00" />
+        <register type="NOA" address="0x00009888" value="0x12050002" />
+        <register type="NOA" address="0x00009888" value="0x00050025" />
+        <register type="NOA" address="0x00009888" value="0x06050900" />
+        <register type="NOA" address="0x00009888" value="0x080508EA" />
+        <register type="NOA" address="0x00009888" value="0x0A0508AB" />
+        <register type="NOA" address="0x00009888" value="0x0C050A21" />
+        <register type="NOA" address="0x00009888" value="0x0E050A60" />
+        <register type="NOA" address="0x00009888" value="0x04050000" />
+        <register type="NOA" address="0x00009888" value="0x14050000" />
+        <register type="NOA" address="0x00009888" value="0x24068100" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4800" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x461F0000" />
+        <register type="NOA" address="0x00009888" value="0x481F0000" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000022" />
+        <register type="OA" address="0x00002774" value="0x0000FFF8" />
+        <register type="OA" address="0x00002778" value="0x00000082" />
+        <register type="OA" address="0x0000277C" value="0x0000FFE7" />
+        <register type="OA" address="0x00002780" value="0x00000402" />
+        <register type="OA" address="0x00002784" value="0x0000FF1F" />
+        <register type="OA" address="0x00002788" value="0x00001002" />
+        <register type="OA" address="0x0000278C" value="0x0000FCFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+        <register type="FLEX" address="0x0000E658" value="0x00011010" />
+        <register type="FLEX" address="0x0000E758" value="0x00050012" />
+        <register type="FLEX" address="0x0000E45C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E55C" value="0x00000053" />
+    </register_config>
+  </set>
+
+  <set name="Gen11 L2Bank1 stalled metric set"
+       mdapi_supported_apis="OGL OGL4 OCL MEDIA IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="47c364d5-1799-4d17-9447-add9358c6451"
+       chipset="ICL"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD B 2 READ FADD B 3 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x10050400" />
+        <register type="NOA" address="0x00009888" value="0x12050000" />
+        <register type="NOA" address="0x00009888" value="0x00050025" />
+        <register type="NOA" address="0x00009888" value="0x06050900" />
+        <register type="NOA" address="0x00009888" value="0x080508EA" />
+        <register type="NOA" address="0x00009888" value="0x0A0508AB" />
+        <register type="NOA" address="0x00009888" value="0x0C050A21" />
+        <register type="NOA" address="0x00009888" value="0x0E050A60" />
+        <register type="NOA" address="0x00009888" value="0x04050000" />
+        <register type="NOA" address="0x00009888" value="0x14050000" />
+        <register type="NOA" address="0x00009888" value="0x24068100" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4800" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x461F0000" />
+        <register type="NOA" address="0x00009888" value="0x481F0000" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000022" />
+        <register type="OA" address="0x00002774" value="0x0000FFF8" />
+        <register type="OA" address="0x00002778" value="0x00000082" />
+        <register type="OA" address="0x0000277C" value="0x0000FFE7" />
+        <register type="OA" address="0x00002780" value="0x00000402" />
+        <register type="OA" address="0x00002784" value="0x0000FF1F" />
+        <register type="OA" address="0x00002788" value="0x00001002" />
+        <register type="OA" address="0x0000278C" value="0x0000FCFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+        <register type="FLEX" address="0x0000E658" value="0x00011010" />
+        <register type="FLEX" address="0x0000E758" value="0x00050012" />
+        <register type="FLEX" address="0x0000E45C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E55C" value="0x00000053" />
+    </register_config>
+  </set>
+
+  <set name="Gen11 L2Bank4 stalled metric set"
+       mdapi_supported_apis="OGL OGL4 OCL MEDIA IO BB"
+       underscore_name="l3_4"
+       hw_config_guid="e5ab5c08-3130-4469-8eaf-b23d3dc817d4"
+       chipset="ICL"
+       symbol_name="L3_4"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 L3 Bank4 Stalled"
+             description="The percentage of time in which slice0 L3 bank4 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD B 2 READ FADD B 3 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank4_stalled"
+             units="percent"
+             symbol_name="L30Bank4Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x10010C00" />
+        <register type="NOA" address="0x00009888" value="0x12010002" />
+        <register type="NOA" address="0x00009888" value="0x0C000400" />
+        <register type="NOA" address="0x00009888" value="0x0E005500" />
+        <register type="NOA" address="0x00009888" value="0x10000155" />
+        <register type="NOA" address="0x00009888" value="0x00010025" />
+        <register type="NOA" address="0x00009888" value="0x06010900" />
+        <register type="NOA" address="0x00009888" value="0x080108EA" />
+        <register type="NOA" address="0x00009888" value="0x0A0108AB" />
+        <register type="NOA" address="0x00009888" value="0x0C010A21" />
+        <register type="NOA" address="0x00009888" value="0x0E010A60" />
+        <register type="NOA" address="0x00009888" value="0x04010000" />
+        <register type="NOA" address="0x00009888" value="0x14010000" />
+        <register type="NOA" address="0x00009888" value="0x0C040400" />
+        <register type="NOA" address="0x00009888" value="0x0E045500" />
+        <register type="NOA" address="0x00009888" value="0x10040155" />
+        <register type="NOA" address="0x00009888" value="0x04051000" />
+        <register type="NOA" address="0x00009888" value="0x0A054000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x24068100" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009888" value="0x00124000" />
+        <register type="NOA" address="0x00009888" value="0x0E124000" />
+        <register type="NOA" address="0x00009888" value="0x18125540" />
+        <register type="NOA" address="0x00009888" value="0x1A120015" />
+        <register type="NOA" address="0x00009888" value="0x04131000" />
+        <register type="NOA" address="0x00009888" value="0x06138000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x0A13F000" />
+        <register type="NOA" address="0x00009888" value="0x00144000" />
+        <register type="NOA" address="0x00009888" value="0x06148000" />
+        <register type="NOA" address="0x00009888" value="0x0814C000" />
+        <register type="NOA" address="0x00009888" value="0x0A14C000" />
+        <register type="NOA" address="0x00009888" value="0x0C14C000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00154000" />
+        <register type="NOA" address="0x00009888" value="0x0E154000" />
+        <register type="NOA" address="0x00009888" value="0x16152AA8" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4800" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x461F0000" />
+        <register type="NOA" address="0x00009888" value="0x481F0000" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000022" />
+        <register type="OA" address="0x00002774" value="0x0000FFF8" />
+        <register type="OA" address="0x00002778" value="0x00000082" />
+        <register type="OA" address="0x0000277C" value="0x0000FFE7" />
+        <register type="OA" address="0x00002780" value="0x00000402" />
+        <register type="OA" address="0x00002784" value="0x0000FF1F" />
+        <register type="OA" address="0x00002788" value="0x00001002" />
+        <register type="OA" address="0x0000278C" value="0x0000FCFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+        <register type="FLEX" address="0x0000E658" value="0x00011010" />
+        <register type="FLEX" address="0x0000E758" value="0x00050012" />
+        <register type="FLEX" address="0x0000E45C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E55C" value="0x00000053" />
+    </register_config>
+  </set>
+
+  <set name="Gen11 L2Bank5 stalled metric set"
+       mdapi_supported_apis="OGL OGL4 OCL MEDIA IO BB"
+       underscore_name="l3_5"
+       hw_config_guid="6cdf23c1-f725-414c-959a-c90fa5571b1f"
+       chipset="ICL"
+       symbol_name="L3_5"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank5 Stalled"
+             description="The percentage of time in which slice0 L3 bank5 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ B 3 READ FADD B 0 READ FADD B 1 READ FADD 4 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank5_stalled"
+             units="percent"
+             symbol_name="L30Bank5Stalled"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x10010400" />
+        <register type="NOA" address="0x00009888" value="0x12010000" />
+        <register type="NOA" address="0x00009888" value="0x0C000400" />
+        <register type="NOA" address="0x00009888" value="0x0E005500" />
+        <register type="NOA" address="0x00009888" value="0x10000155" />
+        <register type="NOA" address="0x00009888" value="0x00010022" />
+        <register type="NOA" address="0x00009888" value="0x06010840" />
+        <register type="NOA" address="0x00009888" value="0x08010828" />
+        <register type="NOA" address="0x00009888" value="0x0A010969" />
+        <register type="NOA" address="0x00009888" value="0x0C010AA4" />
+        <register type="NOA" address="0x00009888" value="0x0E010AE3" />
+        <register type="NOA" address="0x00009888" value="0x04010000" />
+        <register type="NOA" address="0x00009888" value="0x14010000" />
+        <register type="NOA" address="0x00009888" value="0x0C040400" />
+        <register type="NOA" address="0x00009888" value="0x0E045500" />
+        <register type="NOA" address="0x00009888" value="0x10040155" />
+        <register type="NOA" address="0x00009888" value="0x04051000" />
+        <register type="NOA" address="0x00009888" value="0x0A054000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x24068100" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009888" value="0x00124000" />
+        <register type="NOA" address="0x00009888" value="0x0E124000" />
+        <register type="NOA" address="0x00009888" value="0x18125540" />
+        <register type="NOA" address="0x00009888" value="0x1A120015" />
+        <register type="NOA" address="0x00009888" value="0x04131000" />
+        <register type="NOA" address="0x00009888" value="0x06138000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x0A13F000" />
+        <register type="NOA" address="0x00009888" value="0x00144000" />
+        <register type="NOA" address="0x00009888" value="0x06148000" />
+        <register type="NOA" address="0x00009888" value="0x0814C000" />
+        <register type="NOA" address="0x00009888" value="0x0A14C000" />
+        <register type="NOA" address="0x00009888" value="0x0C14C000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00154000" />
+        <register type="NOA" address="0x00009888" value="0x0E154000" />
+        <register type="NOA" address="0x00009888" value="0x16152AA8" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4800" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3E1F0000" />
+        <register type="NOA" address="0x00009888" value="0x461F0000" />
+        <register type="NOA" address="0x00009888" value="0x481F0000" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000022" />
+        <register type="OA" address="0x00002774" value="0x0000FFF8" />
+        <register type="OA" address="0x00002778" value="0x00000082" />
+        <register type="OA" address="0x0000277C" value="0x0000FFE7" />
+        <register type="OA" address="0x00002780" value="0x00000402" />
+        <register type="OA" address="0x00002784" value="0x0000FF1F" />
+        <register type="OA" address="0x00002788" value="0x00001002" />
+        <register type="OA" address="0x0000278C" value="0x0000FCFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+        <register type="FLEX" address="0x0000E658" value="0x00011010" />
+        <register type="FLEX" address="0x0000E758" value="0x00050012" />
+        <register type="FLEX" address="0x0000E45C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E55C" value="0x00000053" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler 1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler_1"
+       hw_config_guid="51a2eb6d-9fad-4489-8f22-ab845fe7882a"
+       chipset="ICL"
+       symbol_name="Sampler_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Slice0 Subslice6 Input Available"
+             description="The percentage of time in which slice0 subslice6 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler06_input_available"
+             units="percent"
+             symbol_name="Sampler06InputAvailable"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice4 Input Available"
+             description="The percentage of time in which slice0 subslice4 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler04_input_available"
+             units="percent"
+             symbol_name="Sampler04InputAvailable"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice0 Subslice3 Input Available"
+             description="The percentage of time in which slice0 subslice3 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler03_input_available"
+             units="percent"
+             symbol_name="Sampler03InputAvailable"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice5 Input Available"
+             description="The percentage of time in which slice0 subslice5 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler05_input_available"
+             units="percent"
+             symbol_name="Sampler05InputAvailable"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice7 Input Available"
+             description="The percentage of time in which slice0 subslice7 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler07_input_available"
+             units="percent"
+             symbol_name="Sampler07InputAvailable"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x142A0165" />
+        <register type="NOA" address="0x00009888" value="0x142F0165" />
+        <register type="NOA" address="0x00009888" value="0x146A0165" />
+        <register type="NOA" address="0x00009888" value="0x146F0165" />
+        <register type="NOA" address="0x00009888" value="0x14AA0165" />
+        <register type="NOA" address="0x00009888" value="0x14AF0165" />
+        <register type="NOA" address="0x00009888" value="0x14EA0165" />
+        <register type="NOA" address="0x00009888" value="0x14EF0165" />
+        <register type="NOA" address="0x00009888" value="0x161E8000" />
+        <register type="NOA" address="0x00009888" value="0x181EC000" />
+        <register type="NOA" address="0x00009888" value="0x1A1E0400" />
+        <register type="NOA" address="0x00009888" value="0x061F8000" />
+        <register type="NOA" address="0x00009888" value="0x081F8000" />
+        <register type="NOA" address="0x00009888" value="0x0A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1F0400" />
+        <register type="NOA" address="0x00009888" value="0x06204000" />
+        <register type="NOA" address="0x00009888" value="0x08204000" />
+        <register type="NOA" address="0x00009888" value="0x0A204000" />
+        <register type="NOA" address="0x00009888" value="0x0C204000" />
+        <register type="NOA" address="0x00009888" value="0x06218000" />
+        <register type="NOA" address="0x00009888" value="0x08218000" />
+        <register type="NOA" address="0x00009888" value="0x0A218000" />
+        <register type="NOA" address="0x00009888" value="0x0C218000" />
+        <register type="NOA" address="0x00009888" value="0x042A1800" />
+        <register type="NOA" address="0x00009888" value="0x062AC038" />
+        <register type="NOA" address="0x00009888" value="0x102A0000" />
+        <register type="NOA" address="0x00009888" value="0x082AC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2A0000" />
+        <register type="NOA" address="0x00009888" value="0x0C2A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x182C0002" />
+        <register type="NOA" address="0x00009888" value="0x022F2000" />
+        <register type="NOA" address="0x00009888" value="0x042F0048" />
+        <register type="NOA" address="0x00009888" value="0x102F0000" />
+        <register type="NOA" address="0x00009888" value="0x1C5E000C" />
+        <register type="NOA" address="0x00009888" value="0x125E8000" />
+        <register type="NOA" address="0x00009888" value="0x145E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5F000C" />
+        <register type="NOA" address="0x00009888" value="0x025F8000" />
+        <register type="NOA" address="0x00009888" value="0x045F8000" />
+        <register type="NOA" address="0x00009888" value="0x1C600014" />
+        <register type="NOA" address="0x00009888" value="0x02604000" />
+        <register type="NOA" address="0x00009888" value="0x04604000" />
+        <register type="NOA" address="0x00009888" value="0x16612800" />
+        <register type="NOA" address="0x00009888" value="0x02618000" />
+        <register type="NOA" address="0x00009888" value="0x04618000" />
+        <register type="NOA" address="0x00009888" value="0x006A1800" />
+        <register type="NOA" address="0x00009888" value="0x026A0038" />
+        <register type="NOA" address="0x00009888" value="0x106A0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6A00F0" />
+        <register type="NOA" address="0x00009888" value="0x046A0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C000A" />
+        <register type="NOA" address="0x00009888" value="0x066C8000" />
+        <register type="NOA" address="0x00009888" value="0x086C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6F2440" />
+        <register type="NOA" address="0x00009888" value="0x106F0000" />
+        <register type="NOA" address="0x00009888" value="0x1A9EC000" />
+        <register type="NOA" address="0x00009888" value="0x1C9E0003" />
+        <register type="NOA" address="0x00009888" value="0x0C9FC000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F0003" />
+        <register type="NOA" address="0x00009888" value="0x1AA02A00" />
+        <register type="NOA" address="0x00009888" value="0x1CA00001" />
+        <register type="NOA" address="0x00009888" value="0x16A102A8" />
+        <register type="NOA" address="0x00009888" value="0x0CAA1C30" />
+        <register type="NOA" address="0x00009888" value="0x10AA0000" />
+        <register type="NOA" address="0x00009888" value="0x18AAF000" />
+        <register type="NOA" address="0x00009888" value="0x1AAA0000" />
+        <register type="NOA" address="0x00009888" value="0x18ACAA00" />
+        <register type="NOA" address="0x00009888" value="0x0AAF2440" />
+        <register type="NOA" address="0x00009888" value="0x10AF0000" />
+        <register type="NOA" address="0x00009888" value="0x10DE8000" />
+        <register type="NOA" address="0x00009888" value="0x1ADE3800" />
+        <register type="NOA" address="0x00009888" value="0x00DF8000" />
+        <register type="NOA" address="0x00009888" value="0x0CDF3800" />
+        <register type="NOA" address="0x00009888" value="0x00E04000" />
+        <register type="NOA" address="0x00009888" value="0x0EE04000" />
+        <register type="NOA" address="0x00009888" value="0x1AE000A0" />
+        <register type="NOA" address="0x00009888" value="0x00E18000" />
+        <register type="NOA" address="0x00009888" value="0x0EE18000" />
+        <register type="NOA" address="0x00009888" value="0x14E18000" />
+        <register type="NOA" address="0x00009888" value="0x16E10002" />
+        <register type="NOA" address="0x00009888" value="0x08EA1C30" />
+        <register type="NOA" address="0x00009888" value="0x10EA0000" />
+        <register type="NOA" address="0x00009888" value="0x00EAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EEAC000" />
+        <register type="NOA" address="0x00009888" value="0x18EA0000" />
+        <register type="NOA" address="0x00009888" value="0x04EC8000" />
+        <register type="NOA" address="0x00009888" value="0x18EC00A8" />
+        <register type="NOA" address="0x00009888" value="0x00EF0040" />
+        <register type="NOA" address="0x00009888" value="0x06EF2400" />
+        <register type="NOA" address="0x00009888" value="0x10EF0000" />
+        <register type="NOA" address="0x00009888" value="0x0C045400" />
+        <register type="NOA" address="0x00009888" value="0x0E045555" />
+        <register type="NOA" address="0x00009888" value="0x10040155" />
+        <register type="NOA" address="0x00009888" value="0x04055000" />
+        <register type="NOA" address="0x00009888" value="0x0A055000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x2406FF00" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009888" value="0x0E08A000" />
+        <register type="NOA" address="0x00009888" value="0x00088000" />
+        <register type="NOA" address="0x00009888" value="0x02082000" />
+        <register type="NOA" address="0x00009888" value="0x14090050" />
+        <register type="NOA" address="0x00009888" value="0x04094000" />
+        <register type="NOA" address="0x00009888" value="0x06091000" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x040E1000" />
+        <register type="NOA" address="0x00009888" value="0x0A0E4000" />
+        <register type="NOA" address="0x00009888" value="0x0C0E5000" />
+        <register type="NOA" address="0x00009888" value="0x1812FC00" />
+        <register type="NOA" address="0x00009888" value="0x1A12002B" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x04128000" />
+        <register type="NOA" address="0x00009888" value="0x0813C000" />
+        <register type="NOA" address="0x00009888" value="0x0A13F000" />
+        <register type="NOA" address="0x00009888" value="0x04136000" />
+        <register type="NOA" address="0x00009888" value="0x0A14C000" />
+        <register type="NOA" address="0x00009888" value="0x0C14C000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x02144000" />
+        <register type="NOA" address="0x00009888" value="0x00158000" />
+        <register type="NOA" address="0x00009888" value="0x0E158000" />
+        <register type="NOA" address="0x00009888" value="0x16152AD0" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x0615C000" />
+        <register type="NOA" address="0x00009888" value="0x0815C000" />
+        <register type="NOA" address="0x00009888" value="0x0A15C000" />
+        <register type="NOA" address="0x00009888" value="0x0C15C000" />
+        <register type="NOA" address="0x00009888" value="0x02188000" />
+        <register type="NOA" address="0x00009888" value="0x0418A000" />
+        <register type="NOA" address="0x00009888" value="0x06182000" />
+        <register type="NOA" address="0x00009888" value="0x0A198000" />
+        <register type="NOA" address="0x00009888" value="0x0C19A000" />
+        <register type="NOA" address="0x00009888" value="0x0E192000" />
+        <register type="NOA" address="0x00009888" value="0x0A1CA000" />
+        <register type="NOA" address="0x00009888" value="0x0C1CA000" />
+        <register type="NOA" address="0x00009888" value="0x121D5400" />
+        <register type="NOA" address="0x00009888" value="0x141D0002" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4924" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2400" />
+        <register type="NOA" address="0x00009888" value="0x3E1F3000" />
+        <register type="NOA" address="0x00009888" value="0x461F4030" />
+        <register type="NOA" address="0x00009888" value="0x481F0040" />
+        <register type="NOA" address="0x00009888" value="0x4A1F1000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0010" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F1010" />
+        <register type="NOA" address="0x00009888" value="0x421F3030" />
+        <register type="NOA" address="0x00009888" value="0x441F4040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00000018" />
+        <register type="OA" address="0x00002774" value="0x0000FFFC" />
+        <register type="OA" address="0x00002778" value="0x00000060" />
+        <register type="OA" address="0x0000277C" value="0x0000FFF3" />
+        <register type="OA" address="0x00002780" value="0x00000180" />
+        <register type="OA" address="0x00002784" value="0x0000FFCF" />
+        <register type="OA" address="0x00002788" value="0x00000600" />
+        <register type="OA" address="0x0000278C" value="0x0000FF3F" />
+        <register type="OA" address="0x00002790" value="0x00001800" />
+        <register type="OA" address="0x00002794" value="0x0000FCFF" />
+        <register type="OA" address="0x00002798" value="0x00006000" />
+        <register type="OA" address="0x0000279C" value="0x0000F3FF" />
+        <register type="OA" address="0x000027A0" value="0x00018000" />
+        <register type="OA" address="0x000027A4" value="0x0000CFFF" />
+        <register type="OA" address="0x000027A8" value="0x00060000" />
+        <register type="OA" address="0x000027AC" value="0x00003FFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler 2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler_2"
+       hw_config_guid="afc0f021-8c33-4d60-803d-93487f96c7c1"
+       chipset="ICL"
+       symbol_name="Sampler_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Subslice6 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice6 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler06_output_ready"
+             units="percent"
+             symbol_name="Sampler06OutputReady"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice4 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice4 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler04_output_ready"
+             units="percent"
+             symbol_name="Sampler04OutputReady"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Slice0 Subslice3 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice3 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler03_output_ready"
+             units="percent"
+             symbol_name="Sampler03OutputReady"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice7 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice7 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler07_output_ready"
+             units="percent"
+             symbol_name="Sampler07OutputReady"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Slice0 Subslice5 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice5 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler05_output_ready"
+             units="percent"
+             symbol_name="Sampler05OutputReady"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x142D0005" />
+        <register type="NOA" address="0x00009888" value="0x14320005" />
+        <register type="NOA" address="0x00009888" value="0x146D0005" />
+        <register type="NOA" address="0x00009888" value="0x14720005" />
+        <register type="NOA" address="0x00009888" value="0x14AD0005" />
+        <register type="NOA" address="0x00009888" value="0x14B20005" />
+        <register type="NOA" address="0x00009888" value="0x14ED0005" />
+        <register type="NOA" address="0x00009888" value="0x14F20005" />
+        <register type="NOA" address="0x00009888" value="0x1C1E000C" />
+        <register type="NOA" address="0x00009888" value="0x0E1F000C" />
+        <register type="NOA" address="0x00009888" value="0x1C200014" />
+        <register type="NOA" address="0x00009888" value="0x16212800" />
+        <register type="NOA" address="0x00009888" value="0x22290010" />
+        <register type="NOA" address="0x00009888" value="0x1A2A00D0" />
+        <register type="NOA" address="0x00009888" value="0x1A2C000A" />
+        <register type="NOA" address="0x00009888" value="0x0E2D0033" />
+        <register type="NOA" address="0x00009888" value="0x022D0000" />
+        <register type="NOA" address="0x00009888" value="0x0E2F8000" />
+        <register type="NOA" address="0x00009888" value="0x1E300080" />
+        <register type="NOA" address="0x00009888" value="0x1A310008" />
+        <register type="NOA" address="0x00009888" value="0x0E321980" />
+        <register type="NOA" address="0x00009888" value="0x02320000" />
+        <register type="NOA" address="0x00009888" value="0x125E8000" />
+        <register type="NOA" address="0x00009888" value="0x145E8000" />
+        <register type="NOA" address="0x00009888" value="0x025F8000" />
+        <register type="NOA" address="0x00009888" value="0x045F8000" />
+        <register type="NOA" address="0x00009888" value="0x02604000" />
+        <register type="NOA" address="0x00009888" value="0x04604000" />
+        <register type="NOA" address="0x00009888" value="0x02618000" />
+        <register type="NOA" address="0x00009888" value="0x04618000" />
+        <register type="NOA" address="0x00009888" value="0x12698000" />
+        <register type="NOA" address="0x00009888" value="0x026A4000" />
+        <register type="NOA" address="0x00009888" value="0x046AC000" />
+        <register type="NOA" address="0x00009888" value="0x066C8000" />
+        <register type="NOA" address="0x00009888" value="0x086C8000" />
+        <register type="NOA" address="0x00009888" value="0x006D1980" />
+        <register type="NOA" address="0x00009888" value="0x026D0000" />
+        <register type="NOA" address="0x00009888" value="0x026F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A702000" />
+        <register type="NOA" address="0x00009888" value="0x08718000" />
+        <register type="NOA" address="0x00009888" value="0x02720033" />
+        <register type="NOA" address="0x00009888" value="0x169E8000" />
+        <register type="NOA" address="0x00009888" value="0x189E4000" />
+        <register type="NOA" address="0x00009888" value="0x069F8000" />
+        <register type="NOA" address="0x00009888" value="0x089F8000" />
+        <register type="NOA" address="0x00009888" value="0x06A04000" />
+        <register type="NOA" address="0x00009888" value="0x08A04000" />
+        <register type="NOA" address="0x00009888" value="0x06A18000" />
+        <register type="NOA" address="0x00009888" value="0x08A18000" />
+        <register type="NOA" address="0x00009888" value="0x16A98000" />
+        <register type="NOA" address="0x00009888" value="0x06AA4000" />
+        <register type="NOA" address="0x00009888" value="0x08AAC000" />
+        <register type="NOA" address="0x00009888" value="0x0AAC8000" />
+        <register type="NOA" address="0x00009888" value="0x0CAC8000" />
+        <register type="NOA" address="0x00009888" value="0x02AD1980" />
+        <register type="NOA" address="0x00009888" value="0x04AF4000" />
+        <register type="NOA" address="0x00009888" value="0x1CB00002" />
+        <register type="NOA" address="0x00009888" value="0x0CB18000" />
+        <register type="NOA" address="0x00009888" value="0x04B20033" />
+        <register type="NOA" address="0x00009888" value="0x02B20000" />
+        <register type="NOA" address="0x00009888" value="0x18DE8000" />
+        <register type="NOA" address="0x00009888" value="0x1ADE0400" />
+        <register type="NOA" address="0x00009888" value="0x0ADF8000" />
+        <register type="NOA" address="0x00009888" value="0x0CDF0400" />
+        <register type="NOA" address="0x00009888" value="0x0AE04000" />
+        <register type="NOA" address="0x00009888" value="0x0CE04000" />
+        <register type="NOA" address="0x00009888" value="0x0AE18000" />
+        <register type="NOA" address="0x00009888" value="0x0CE18000" />
+        <register type="NOA" address="0x00009888" value="0x1EE98000" />
+        <register type="NOA" address="0x00009888" value="0x0AEA4000" />
+        <register type="NOA" address="0x00009888" value="0x0CEAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EEC8000" />
+        <register type="NOA" address="0x00009888" value="0x18EC0002" />
+        <register type="NOA" address="0x00009888" value="0x04ED1980" />
+        <register type="NOA" address="0x00009888" value="0x02ED0000" />
+        <register type="NOA" address="0x00009888" value="0x06EF4000" />
+        <register type="NOA" address="0x00009888" value="0x1CF00020" />
+        <register type="NOA" address="0x00009888" value="0x18F10002" />
+        <register type="NOA" address="0x00009888" value="0x06F20033" />
+        <register type="NOA" address="0x00009888" value="0x02F20000" />
+        <register type="NOA" address="0x00009888" value="0x10040140" />
+        <register type="NOA" address="0x00009888" value="0x0C045000" />
+        <register type="NOA" address="0x00009888" value="0x0E040055" />
+        <register type="NOA" address="0x00009888" value="0x14050050" />
+        <register type="NOA" address="0x00009888" value="0x04054000" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x0A051000" />
+        <register type="NOA" address="0x00009888" value="0x260600C0" />
+        <register type="NOA" address="0x00009888" value="0x24067E00" />
+        <register type="NOA" address="0x00009888" value="0x00088000" />
+        <register type="NOA" address="0x00009888" value="0x02082000" />
+        <register type="NOA" address="0x00009888" value="0x04094000" />
+        <register type="NOA" address="0x00009888" value="0x06091000" />
+        <register type="NOA" address="0x00009888" value="0x040D8000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x080E4000" />
+        <register type="NOA" address="0x00009888" value="0x0A0E1000" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x04128000" />
+        <register type="NOA" address="0x00009888" value="0x0612C000" />
+        <register type="NOA" address="0x00009888" value="0x0812C000" />
+        <register type="NOA" address="0x00009888" value="0x0413E000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x0214C000" />
+        <register type="NOA" address="0x00009888" value="0x04144000" />
+        <register type="NOA" address="0x00009888" value="0x1815000F" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x08154000" />
+        <register type="NOA" address="0x00009888" value="0x0A158000" />
+        <register type="NOA" address="0x00009888" value="0x0C158000" />
+        <register type="NOA" address="0x00009888" value="0x0E18A000" />
+        <register type="NOA" address="0x00009888" value="0x14190028" />
+        <register type="NOA" address="0x00009888" value="0x021C8000" />
+        <register type="NOA" address="0x00009888" value="0x041C2000" />
+        <register type="NOA" address="0x00009888" value="0x0A1D8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1D2000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1C1F3000" />
+        <register type="NOA" address="0x00009888" value="0x2A1F0061" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x521F0000" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2430" />
+        <register type="NOA" address="0x00009888" value="0x501F0124" />
+        <register type="NOA" address="0x00009888" value="0x4C1F5047" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F0020" />
+        <register type="NOA" address="0x00009888" value="0x421F0020" />
+        <register type="NOA" address="0x00009888" value="0x441F3050" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="eddc2f32-b196-4a72-9bf8-21770e35f8bd"
+       chipset="ICL"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice3 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice3 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread03_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread03ReadyForDispatch"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 20 READ A 6 READ UDIV"
+             underscore_name="ps_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="PsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS AVG Stall per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were stalled on the EUs."
+             data_type="uint64"
+             equation="A 14 READ A 1 READ UDIV"
+             underscore_name="vs_eu_stall_per_thread"
+             units="cycles"
+             symbol_name="VsEuStallPerThread"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which fragment shaders were processed actively on the EUs."
+             data_type="uint64"
+             equation="A 19 READ A 6 READ UDIV"
+             underscore_name="ps_eu_active_per_thread"
+             units="cycles"
+             symbol_name="PsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="FS EU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_active"
+             units="percent"
+             symbol_name="PsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice7 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice7 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread07_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread07ReadyForDispatch"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="FS EU Stall"
+             description="The percentage of time in which fragment shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_stall"
+             units="percent"
+             symbol_name="PsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice5 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice5 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread05_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread05ReadyForDispatch"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS EU Active"
+             description="The percentage of time in which vertex shaders were processed actively on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_active"
+             units="percent"
+             symbol_name="VsEuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice4 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice4 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread04_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread04ReadyForDispatch"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS EU Stall"
+             description="The percentage of time in which vertex shaders were stalled on the EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_eu_stall"
+             units="percent"
+             symbol_name="VsEuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="VS AVG Active per Thread"
+             description="The average number of cycles per hardware thread run in which vertex shaders were processed actively on the EUs."
+             data_type="uint64"
+             equation="A 13 READ A 1 READ UDIV"
+             underscore_name="vs_eu_active_per_thread"
+             units="cycles"
+             symbol_name="VsEuActivePerThread"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice6 Thread Dispatcher"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice6 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread06_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread06ReadyForDispatch"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x14290000" />
+        <register type="NOA" address="0x00009888" value="0x142E0000" />
+        <register type="NOA" address="0x00009888" value="0x14690000" />
+        <register type="NOA" address="0x00009888" value="0x146E0000" />
+        <register type="NOA" address="0x00009888" value="0x14A90000" />
+        <register type="NOA" address="0x00009888" value="0x14AE0000" />
+        <register type="NOA" address="0x00009888" value="0x14E90000" />
+        <register type="NOA" address="0x00009888" value="0x14EE0000" />
+        <register type="NOA" address="0x00009888" value="0x161E8000" />
+        <register type="NOA" address="0x00009888" value="0x181EC000" />
+        <register type="NOA" address="0x00009888" value="0x1A1E0400" />
+        <register type="NOA" address="0x00009888" value="0x061F8000" />
+        <register type="NOA" address="0x00009888" value="0x081F8000" />
+        <register type="NOA" address="0x00009888" value="0x0A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1F0400" />
+        <register type="NOA" address="0x00009888" value="0x06204000" />
+        <register type="NOA" address="0x00009888" value="0x08204000" />
+        <register type="NOA" address="0x00009888" value="0x0A204000" />
+        <register type="NOA" address="0x00009888" value="0x0C204000" />
+        <register type="NOA" address="0x00009888" value="0x06218000" />
+        <register type="NOA" address="0x00009888" value="0x08218000" />
+        <register type="NOA" address="0x00009888" value="0x0A218000" />
+        <register type="NOA" address="0x00009888" value="0x0C218000" />
+        <register type="NOA" address="0x00009888" value="0x0429C300" />
+        <register type="NOA" address="0x00009888" value="0x062900C5" />
+        <register type="NOA" address="0x00009888" value="0x22290000" />
+        <register type="NOA" address="0x00009888" value="0x1E290000" />
+        <register type="NOA" address="0x00009888" value="0x20290000" />
+        <register type="NOA" address="0x00009888" value="0x062AC000" />
+        <register type="NOA" address="0x00009888" value="0x082AC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2A4000" />
+        <register type="NOA" address="0x00009888" value="0x0C2A4000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x182C0002" />
+        <register type="NOA" address="0x00009888" value="0x022EC300" />
+        <register type="NOA" address="0x00009888" value="0x042E00C5" />
+        <register type="NOA" address="0x00009888" value="0x102E0000" />
+        <register type="NOA" address="0x00009888" value="0x022F8000" />
+        <register type="NOA" address="0x00009888" value="0x042F4000" />
+        <register type="NOA" address="0x00009888" value="0x1A304000" />
+        <register type="NOA" address="0x00009888" value="0x1C300001" />
+        <register type="NOA" address="0x00009888" value="0x1C5E000C" />
+        <register type="NOA" address="0x00009888" value="0x125E8000" />
+        <register type="NOA" address="0x00009888" value="0x145E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5F000C" />
+        <register type="NOA" address="0x00009888" value="0x025F8000" />
+        <register type="NOA" address="0x00009888" value="0x045F8000" />
+        <register type="NOA" address="0x00009888" value="0x1C600014" />
+        <register type="NOA" address="0x00009888" value="0x02604000" />
+        <register type="NOA" address="0x00009888" value="0x04604000" />
+        <register type="NOA" address="0x00009888" value="0x16612800" />
+        <register type="NOA" address="0x00009888" value="0x02618000" />
+        <register type="NOA" address="0x00009888" value="0x04618000" />
+        <register type="NOA" address="0x00009888" value="0x0069C300" />
+        <register type="NOA" address="0x00009888" value="0x026900C5" />
+        <register type="NOA" address="0x00009888" value="0x22690000" />
+        <register type="NOA" address="0x00009888" value="0x12690000" />
+        <register type="NOA" address="0x00009888" value="0x1A6A00F0" />
+        <register type="NOA" address="0x00009888" value="0x026A4000" />
+        <register type="NOA" address="0x00009888" value="0x046A4000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C000A" />
+        <register type="NOA" address="0x00009888" value="0x066C8000" />
+        <register type="NOA" address="0x00009888" value="0x086C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6EC5C3" />
+        <register type="NOA" address="0x00009888" value="0x106E0000" />
+        <register type="NOA" address="0x00009888" value="0x0E6FC000" />
+        <register type="NOA" address="0x00009888" value="0x1E700050" />
+        <register type="NOA" address="0x00009888" value="0x1A9EC000" />
+        <register type="NOA" address="0x00009888" value="0x1C9E0003" />
+        <register type="NOA" address="0x00009888" value="0x0C9FC000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F0003" />
+        <register type="NOA" address="0x00009888" value="0x1AA02A00" />
+        <register type="NOA" address="0x00009888" value="0x1CA00001" />
+        <register type="NOA" address="0x00009888" value="0x16A102A8" />
+        <register type="NOA" address="0x00009888" value="0x0CA9C5C3" />
+        <register type="NOA" address="0x00009888" value="0x22A90000" />
+        <register type="NOA" address="0x00009888" value="0x18AAF000" />
+        <register type="NOA" address="0x00009888" value="0x1AAA0005" />
+        <register type="NOA" address="0x00009888" value="0x18ACAA00" />
+        <register type="NOA" address="0x00009888" value="0x0AAEC5C3" />
+        <register type="NOA" address="0x00009888" value="0x10AE0000" />
+        <register type="NOA" address="0x00009888" value="0x0AAFC000" />
+        <register type="NOA" address="0x00009888" value="0x1CB05000" />
+        <register type="NOA" address="0x00009888" value="0x10DE8000" />
+        <register type="NOA" address="0x00009888" value="0x1ADE3800" />
+        <register type="NOA" address="0x00009888" value="0x00DF8000" />
+        <register type="NOA" address="0x00009888" value="0x0CDF3800" />
+        <register type="NOA" address="0x00009888" value="0x00E04000" />
+        <register type="NOA" address="0x00009888" value="0x0EE04000" />
+        <register type="NOA" address="0x00009888" value="0x1AE000A0" />
+        <register type="NOA" address="0x00009888" value="0x00E18000" />
+        <register type="NOA" address="0x00009888" value="0x0EE18000" />
+        <register type="NOA" address="0x00009888" value="0x14E18000" />
+        <register type="NOA" address="0x00009888" value="0x16E10002" />
+        <register type="NOA" address="0x00009888" value="0x08E9C5C3" />
+        <register type="NOA" address="0x00009888" value="0x22E90000" />
+        <register type="NOA" address="0x00009888" value="0x20E90000" />
+        <register type="NOA" address="0x00009888" value="0x00EAC000" />
+        <register type="NOA" address="0x00009888" value="0x0EEAC000" />
+        <register type="NOA" address="0x00009888" value="0x18EA0500" />
+        <register type="NOA" address="0x00009888" value="0x04EC8000" />
+        <register type="NOA" address="0x00009888" value="0x18EC00A8" />
+        <register type="NOA" address="0x00009888" value="0x00EE00C3" />
+        <register type="NOA" address="0x00009888" value="0x06EEC500" />
+        <register type="NOA" address="0x00009888" value="0x10EE0000" />
+        <register type="NOA" address="0x00009888" value="0x00EF4000" />
+        <register type="NOA" address="0x00009888" value="0x06EF8000" />
+        <register type="NOA" address="0x00009888" value="0x18F04000" />
+        <register type="NOA" address="0x00009888" value="0x1CF00040" />
+        <register type="NOA" address="0x00009888" value="0x0C045400" />
+        <register type="NOA" address="0x00009888" value="0x0E045555" />
+        <register type="NOA" address="0x00009888" value="0x10040155" />
+        <register type="NOA" address="0x00009888" value="0x04055000" />
+        <register type="NOA" address="0x00009888" value="0x0A055000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x2406FF00" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009888" value="0x0E08A000" />
+        <register type="NOA" address="0x00009888" value="0x00088000" />
+        <register type="NOA" address="0x00009888" value="0x02082000" />
+        <register type="NOA" address="0x00009888" value="0x14090050" />
+        <register type="NOA" address="0x00009888" value="0x04094000" />
+        <register type="NOA" address="0x00009888" value="0x06091000" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x040E1000" />
+        <register type="NOA" address="0x00009888" value="0x0A0E4000" />
+        <register type="NOA" address="0x00009888" value="0x0C0E5000" />
+        <register type="NOA" address="0x00009888" value="0x1812FC00" />
+        <register type="NOA" address="0x00009888" value="0x1A12002B" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x04128000" />
+        <register type="NOA" address="0x00009888" value="0x0813C000" />
+        <register type="NOA" address="0x00009888" value="0x0A13F000" />
+        <register type="NOA" address="0x00009888" value="0x04136000" />
+        <register type="NOA" address="0x00009888" value="0x0A14C000" />
+        <register type="NOA" address="0x00009888" value="0x0C14C000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x02144000" />
+        <register type="NOA" address="0x00009888" value="0x00158000" />
+        <register type="NOA" address="0x00009888" value="0x0E158000" />
+        <register type="NOA" address="0x00009888" value="0x16152AD0" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x0615C000" />
+        <register type="NOA" address="0x00009888" value="0x0815C000" />
+        <register type="NOA" address="0x00009888" value="0x0A15C000" />
+        <register type="NOA" address="0x00009888" value="0x0C15C000" />
+        <register type="NOA" address="0x00009888" value="0x02188000" />
+        <register type="NOA" address="0x00009888" value="0x0418A000" />
+        <register type="NOA" address="0x00009888" value="0x06182000" />
+        <register type="NOA" address="0x00009888" value="0x0A198000" />
+        <register type="NOA" address="0x00009888" value="0x0C19A000" />
+        <register type="NOA" address="0x00009888" value="0x0E192000" />
+        <register type="NOA" address="0x00009888" value="0x0A1CA000" />
+        <register type="NOA" address="0x00009888" value="0x0C1CA000" />
+        <register type="NOA" address="0x00009888" value="0x121D5400" />
+        <register type="NOA" address="0x00009888" value="0x141D0002" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4924" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2400" />
+        <register type="NOA" address="0x00009888" value="0x3E1F3000" />
+        <register type="NOA" address="0x00009888" value="0x461F5030" />
+        <register type="NOA" address="0x00009888" value="0x481F0050" />
+        <register type="NOA" address="0x00009888" value="0x4A1F2000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0020" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F2020" />
+        <register type="NOA" address="0x00009888" value="0x421F3030" />
+        <register type="NOA" address="0x00009888" value="0x441F5050" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00000018" />
+        <register type="OA" address="0x00002774" value="0x0000FFFC" />
+        <register type="OA" address="0x00002778" value="0x00000060" />
+        <register type="OA" address="0x0000277C" value="0x0000FFF3" />
+        <register type="OA" address="0x00002780" value="0x00000180" />
+        <register type="OA" address="0x00002784" value="0x0000FFCF" />
+        <register type="OA" address="0x00002788" value="0x00000600" />
+        <register type="OA" address="0x0000278C" value="0x0000FF3F" />
+        <register type="OA" address="0x00002790" value="0x00001800" />
+        <register type="OA" address="0x00002794" value="0x0000FCFF" />
+        <register type="OA" address="0x00002798" value="0x00006000" />
+        <register type="OA" address="0x0000279C" value="0x0000F3FF" />
+        <register type="OA" address="0x000027A0" value="0x00018000" />
+        <register type="OA" address="0x000027A4" value="0x0000CFFF" />
+        <register type="OA" address="0x000027A8" value="0x00060000" />
+        <register type="OA" address="0x000027AC" value="0x00003FFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="c6d3af7b-037b-4656-95e1-4f838f0a2c14"
+       chipset="ICL"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice2 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 1 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice3 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice3 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 2 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread03_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread03ReadyForDispatch"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice0 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ B 7 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice7 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice7 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 6 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread07_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread07ReadyForDispatch"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice6 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice6 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 5 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread06_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread06ReadyForDispatch"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice5 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice5 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 4 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread05_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread05ReadyForDispatch"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice4 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice4 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 3 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread04_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread04ReadyForDispatch"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Non-PS Thread Ready For Dispatch on Slice0 Subslice1 Thread Dispatcher"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="GPU_CLOCK 0 READ C 0 READ FSUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x14290000" />
+        <register type="NOA" address="0x00009888" value="0x142E0000" />
+        <register type="NOA" address="0x00009888" value="0x14690000" />
+        <register type="NOA" address="0x00009888" value="0x146E0000" />
+        <register type="NOA" address="0x00009888" value="0x14A90000" />
+        <register type="NOA" address="0x00009888" value="0x14AE0000" />
+        <register type="NOA" address="0x00009888" value="0x14E90000" />
+        <register type="NOA" address="0x00009888" value="0x14EE0000" />
+        <register type="NOA" address="0x00009888" value="0x1C1E0006" />
+        <register type="NOA" address="0x00009888" value="0x0E1F0006" />
+        <register type="NOA" address="0x00009888" value="0x1C200005" />
+        <register type="NOA" address="0x00009888" value="0x16210A00" />
+        <register type="NOA" address="0x00009888" value="0x0C29C100" />
+        <register type="NOA" address="0x00009888" value="0x22290000" />
+        <register type="NOA" address="0x00009888" value="0x1A2A0034" />
+        <register type="NOA" address="0x00009888" value="0x182C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A2C0002" />
+        <register type="NOA" address="0x00009888" value="0x0E2E00C1" />
+        <register type="NOA" address="0x00009888" value="0x102E0000" />
+        <register type="NOA" address="0x00009888" value="0x0E2F4000" />
+        <register type="NOA" address="0x00009888" value="0x1E300010" />
+        <register type="NOA" address="0x00009888" value="0x1C5E0008" />
+        <register type="NOA" address="0x00009888" value="0x125E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5F0008" />
+        <register type="NOA" address="0x00009888" value="0x025F8000" />
+        <register type="NOA" address="0x00009888" value="0x1C600010" />
+        <register type="NOA" address="0x00009888" value="0x02604000" />
+        <register type="NOA" address="0x00009888" value="0x16612000" />
+        <register type="NOA" address="0x00009888" value="0x02618000" />
+        <register type="NOA" address="0x00009888" value="0x0E69C100" />
+        <register type="NOA" address="0x00009888" value="0x22690000" />
+        <register type="NOA" address="0x00009888" value="0x1A6A0040" />
+        <register type="NOA" address="0x00009888" value="0x026AC000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0008" />
+        <register type="NOA" address="0x00009888" value="0x066C8000" />
+        <register type="NOA" address="0x00009888" value="0x006EC100" />
+        <register type="NOA" address="0x00009888" value="0x106E0000" />
+        <register type="NOA" address="0x00009888" value="0x006F8000" />
+        <register type="NOA" address="0x00009888" value="0x1A700400" />
+        <register type="NOA" address="0x00009888" value="0x149E8000" />
+        <register type="NOA" address="0x00009888" value="0x169E8000" />
+        <register type="NOA" address="0x00009888" value="0x049F8000" />
+        <register type="NOA" address="0x00009888" value="0x069F8000" />
+        <register type="NOA" address="0x00009888" value="0x04A04000" />
+        <register type="NOA" address="0x00009888" value="0x06A04000" />
+        <register type="NOA" address="0x00009888" value="0x04A18000" />
+        <register type="NOA" address="0x00009888" value="0x06A18000" />
+        <register type="NOA" address="0x00009888" value="0x02A900C1" />
+        <register type="NOA" address="0x00009888" value="0x22A90000" />
+        <register type="NOA" address="0x00009888" value="0x04AA4000" />
+        <register type="NOA" address="0x00009888" value="0x06AAC000" />
+        <register type="NOA" address="0x00009888" value="0x08AC8000" />
+        <register type="NOA" address="0x00009888" value="0x0AAC8000" />
+        <register type="NOA" address="0x00009888" value="0x02AEC100" />
+        <register type="NOA" address="0x00009888" value="0x10AE0000" />
+        <register type="NOA" address="0x00009888" value="0x02AF8000" />
+        <register type="NOA" address="0x00009888" value="0x1AB04000" />
+        <register type="NOA" address="0x00009888" value="0x18DEC000" />
+        <register type="NOA" address="0x00009888" value="0x08DF8000" />
+        <register type="NOA" address="0x00009888" value="0x0ADF8000" />
+        <register type="NOA" address="0x00009888" value="0x08E04000" />
+        <register type="NOA" address="0x00009888" value="0x0AE04000" />
+        <register type="NOA" address="0x00009888" value="0x08E18000" />
+        <register type="NOA" address="0x00009888" value="0x0AE18000" />
+        <register type="NOA" address="0x00009888" value="0x04E900C1" />
+        <register type="NOA" address="0x00009888" value="0x22E90000" />
+        <register type="NOA" address="0x00009888" value="0x1CE90000" />
+        <register type="NOA" address="0x00009888" value="0x08EA4000" />
+        <register type="NOA" address="0x00009888" value="0x0AEAC000" />
+        <register type="NOA" address="0x00009888" value="0x0CEC8000" />
+        <register type="NOA" address="0x00009888" value="0x0EEC8000" />
+        <register type="NOA" address="0x00009888" value="0x04EEC100" />
+        <register type="NOA" address="0x00009888" value="0x10EE0000" />
+        <register type="NOA" address="0x00009888" value="0x04EF8000" />
+        <register type="NOA" address="0x00009888" value="0x1CF00004" />
+        <register type="NOA" address="0x00009888" value="0x10040150" />
+        <register type="NOA" address="0x00009888" value="0x0C045000" />
+        <register type="NOA" address="0x00009888" value="0x0E040015" />
+        <register type="NOA" address="0x00009888" value="0x14050054" />
+        <register type="NOA" address="0x00009888" value="0x04054000" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x260600E0" />
+        <register type="NOA" address="0x00009888" value="0x24063E00" />
+        <register type="NOA" address="0x00009888" value="0x0E088000" />
+        <register type="NOA" address="0x00009888" value="0x00088000" />
+        <register type="NOA" address="0x00009888" value="0x14090040" />
+        <register type="NOA" address="0x00009888" value="0x04094000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x080E5000" />
+        <register type="NOA" address="0x00009888" value="0x1A120020" />
+        <register type="NOA" address="0x00009888" value="0x02128000" />
+        <register type="NOA" address="0x00009888" value="0x0412C000" />
+        <register type="NOA" address="0x00009888" value="0x0612C000" />
+        <register type="NOA" address="0x00009888" value="0x0A138000" />
+        <register type="NOA" address="0x00009888" value="0x0413E000" />
+        <register type="NOA" address="0x00009888" value="0x0E148000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x0214C000" />
+        <register type="NOA" address="0x00009888" value="0x16156000" />
+        <register type="NOA" address="0x00009888" value="0x18150007" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x06154000" />
+        <register type="NOA" address="0x00009888" value="0x08158000" />
+        <register type="NOA" address="0x00009888" value="0x0A158000" />
+        <register type="NOA" address="0x00009888" value="0x0C188000" />
+        <register type="NOA" address="0x00009888" value="0x0E182000" />
+        <register type="NOA" address="0x00009888" value="0x1419000A" />
+        <register type="NOA" address="0x00009888" value="0x021CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A1DA000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x1C1F3061" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x521F4000" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2420" />
+        <register type="NOA" address="0x00009888" value="0x501F0024" />
+        <register type="NOA" address="0x00009888" value="0x4C1F3050" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F2000" />
+        <register type="NOA" address="0x00009888" value="0x421F5000" />
+        <register type="NOA" address="0x00009888" value="0x441F3730" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_3"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_3"
+       hw_config_guid="fd25ec19-3ed1-40c9-8648-1d2387449a92"
+       chipset="ICL"
+       symbol_name="TDL_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice6 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice6 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header06_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader06ReadyPort1"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice3 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice3 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header03_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader03ReadyPort0"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice3 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice3 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header03_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader03ReadyPort1"
+             availability="$SubsliceMask 8 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice4 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice4 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header04_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader04ReadyPort1"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice4 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice4 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header04_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader04ReadyPort0"
+             availability="$SubsliceMask 16 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice6 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice6 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header06_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader06ReadyPort0"
+             availability="$SubsliceMask 64 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice7 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice7 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header07_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader07ReadyPort0"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice5 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice5 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header05_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader05ReadyPort0"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice7 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice7 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header07_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader07ReadyPort1"
+             availability="$SubsliceMask 128 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ A 31 READ UADD A 32 READ UADD 64 UMUL"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice5 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice5 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header05_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader05ReadyPort1"
+             availability="$SubsliceMask 32 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Thread Dispatcher Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Thread Dispatcher Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000000" />
+        <register type="NOA" address="0x00009888" value="0x14292C00" />
+        <register type="NOA" address="0x00009888" value="0x16290013" />
+        <register type="NOA" address="0x00009888" value="0x142E2C00" />
+        <register type="NOA" address="0x00009888" value="0x162E0013" />
+        <register type="NOA" address="0x00009888" value="0x14692C00" />
+        <register type="NOA" address="0x00009888" value="0x16690013" />
+        <register type="NOA" address="0x00009888" value="0x146E2C00" />
+        <register type="NOA" address="0x00009888" value="0x166E0013" />
+        <register type="NOA" address="0x00009888" value="0x14A92C00" />
+        <register type="NOA" address="0x00009888" value="0x16A90013" />
+        <register type="NOA" address="0x00009888" value="0x14AE2C00" />
+        <register type="NOA" address="0x00009888" value="0x16AE0013" />
+        <register type="NOA" address="0x00009888" value="0x14E92C00" />
+        <register type="NOA" address="0x00009888" value="0x16E90013" />
+        <register type="NOA" address="0x00009888" value="0x14EE2C00" />
+        <register type="NOA" address="0x00009888" value="0x16EE0013" />
+        <register type="NOA" address="0x00009888" value="0x101E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1E3800" />
+        <register type="NOA" address="0x00009888" value="0x001F8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1F3800" />
+        <register type="NOA" address="0x00009888" value="0x00204000" />
+        <register type="NOA" address="0x00009888" value="0x0E204000" />
+        <register type="NOA" address="0x00009888" value="0x1A2000A0" />
+        <register type="NOA" address="0x00009888" value="0x00218000" />
+        <register type="NOA" address="0x00009888" value="0x0E218000" />
+        <register type="NOA" address="0x00009888" value="0x14218000" />
+        <register type="NOA" address="0x00009888" value="0x16210002" />
+        <register type="NOA" address="0x00009888" value="0x002900C7" />
+        <register type="NOA" address="0x00009888" value="0x0629CF00" />
+        <register type="NOA" address="0x00009888" value="0x22290000" />
+        <register type="NOA" address="0x00009888" value="0x10290000" />
+        <register type="NOA" address="0x00009888" value="0x20290000" />
+        <register type="NOA" address="0x00009888" value="0x002A4000" />
+        <register type="NOA" address="0x00009888" value="0x0E2A4000" />
+        <register type="NOA" address="0x00009888" value="0x182A0F00" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x182C00A8" />
+        <register type="NOA" address="0x00009888" value="0x082ECFC7" />
+        <register type="NOA" address="0x00009888" value="0x102E0000" />
+        <register type="NOA" address="0x00009888" value="0x082FC000" />
+        <register type="NOA" address="0x00009888" value="0x1C300500" />
+        <register type="NOA" address="0x00009888" value="0x1A5EC000" />
+        <register type="NOA" address="0x00009888" value="0x1C5E0003" />
+        <register type="NOA" address="0x00009888" value="0x0C5FC000" />
+        <register type="NOA" address="0x00009888" value="0x0E5F0003" />
+        <register type="NOA" address="0x00009888" value="0x1A602A00" />
+        <register type="NOA" address="0x00009888" value="0x1C600001" />
+        <register type="NOA" address="0x00009888" value="0x166102A8" />
+        <register type="NOA" address="0x00009888" value="0x0A69CFC7" />
+        <register type="NOA" address="0x00009888" value="0x22690000" />
+        <register type="NOA" address="0x00009888" value="0x186A5000" />
+        <register type="NOA" address="0x00009888" value="0x1A6A000F" />
+        <register type="NOA" address="0x00009888" value="0x186CAA00" />
+        <register type="NOA" address="0x00009888" value="0x0C6ECFC7" />
+        <register type="NOA" address="0x00009888" value="0x106E0000" />
+        <register type="NOA" address="0x00009888" value="0x0C6FC000" />
+        <register type="NOA" address="0x00009888" value="0x1E700005" />
+        <register type="NOA" address="0x00009888" value="0x1C9E000C" />
+        <register type="NOA" address="0x00009888" value="0x129E8000" />
+        <register type="NOA" address="0x00009888" value="0x149E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E9F000C" />
+        <register type="NOA" address="0x00009888" value="0x029F8000" />
+        <register type="NOA" address="0x00009888" value="0x049F8000" />
+        <register type="NOA" address="0x00009888" value="0x1CA00014" />
+        <register type="NOA" address="0x00009888" value="0x02A04000" />
+        <register type="NOA" address="0x00009888" value="0x04A04000" />
+        <register type="NOA" address="0x00009888" value="0x16A12800" />
+        <register type="NOA" address="0x00009888" value="0x02A18000" />
+        <register type="NOA" address="0x00009888" value="0x04A18000" />
+        <register type="NOA" address="0x00009888" value="0x0EA9CFC7" />
+        <register type="NOA" address="0x00009888" value="0x22A90000" />
+        <register type="NOA" address="0x00009888" value="0x1AAA0050" />
+        <register type="NOA" address="0x00009888" value="0x02AAC000" />
+        <register type="NOA" address="0x00009888" value="0x04AAC000" />
+        <register type="NOA" address="0x00009888" value="0x1AAC000A" />
+        <register type="NOA" address="0x00009888" value="0x06AC8000" />
+        <register type="NOA" address="0x00009888" value="0x08AC8000" />
+        <register type="NOA" address="0x00009888" value="0x00AEC700" />
+        <register type="NOA" address="0x00009888" value="0x02AE00CF" />
+        <register type="NOA" address="0x00009888" value="0x10AE0000" />
+        <register type="NOA" address="0x00009888" value="0x00AF8000" />
+        <register type="NOA" address="0x00009888" value="0x02AF4000" />
+        <register type="NOA" address="0x00009888" value="0x1AB01400" />
+        <register type="NOA" address="0x00009888" value="0x16DE8000" />
+        <register type="NOA" address="0x00009888" value="0x18DEC000" />
+        <register type="NOA" address="0x00009888" value="0x1ADE0400" />
+        <register type="NOA" address="0x00009888" value="0x06DF8000" />
+        <register type="NOA" address="0x00009888" value="0x08DF8000" />
+        <register type="NOA" address="0x00009888" value="0x0ADF8000" />
+        <register type="NOA" address="0x00009888" value="0x0CDF0400" />
+        <register type="NOA" address="0x00009888" value="0x06E04000" />
+        <register type="NOA" address="0x00009888" value="0x08E04000" />
+        <register type="NOA" address="0x00009888" value="0x0AE04000" />
+        <register type="NOA" address="0x00009888" value="0x0CE04000" />
+        <register type="NOA" address="0x00009888" value="0x06E18000" />
+        <register type="NOA" address="0x00009888" value="0x08E18000" />
+        <register type="NOA" address="0x00009888" value="0x0AE18000" />
+        <register type="NOA" address="0x00009888" value="0x0CE18000" />
+        <register type="NOA" address="0x00009888" value="0x02E9C700" />
+        <register type="NOA" address="0x00009888" value="0x04E900CF" />
+        <register type="NOA" address="0x00009888" value="0x22E90000" />
+        <register type="NOA" address="0x00009888" value="0x1CE90000" />
+        <register type="NOA" address="0x00009888" value="0x06EA4000" />
+        <register type="NOA" address="0x00009888" value="0x08EA4000" />
+        <register type="NOA" address="0x00009888" value="0x0AEAC000" />
+        <register type="NOA" address="0x00009888" value="0x0CEAC000" />
+        <register type="NOA" address="0x00009888" value="0x0AEC8000" />
+        <register type="NOA" address="0x00009888" value="0x0CEC8000" />
+        <register type="NOA" address="0x00009888" value="0x0EEC8000" />
+        <register type="NOA" address="0x00009888" value="0x18EC0002" />
+        <register type="NOA" address="0x00009888" value="0x04EEC700" />
+        <register type="NOA" address="0x00009888" value="0x06EE00CF" />
+        <register type="NOA" address="0x00009888" value="0x10EE0000" />
+        <register type="NOA" address="0x00009888" value="0x04EF8000" />
+        <register type="NOA" address="0x00009888" value="0x06EF4000" />
+        <register type="NOA" address="0x00009888" value="0x1CF00014" />
+        <register type="NOA" address="0x00009888" value="0x0C045400" />
+        <register type="NOA" address="0x00009888" value="0x0E045555" />
+        <register type="NOA" address="0x00009888" value="0x10040155" />
+        <register type="NOA" address="0x00009888" value="0x04055000" />
+        <register type="NOA" address="0x00009888" value="0x0A055000" />
+        <register type="NOA" address="0x00009888" value="0x0C055000" />
+        <register type="NOA" address="0x00009888" value="0x0E055000" />
+        <register type="NOA" address="0x00009888" value="0x14050055" />
+        <register type="NOA" address="0x00009888" value="0x06055000" />
+        <register type="NOA" address="0x00009888" value="0x08055000" />
+        <register type="NOA" address="0x00009888" value="0x2406FF00" />
+        <register type="NOA" address="0x00009888" value="0x260600FF" />
+        <register type="NOA" address="0x00009888" value="0x0A08A000" />
+        <register type="NOA" address="0x00009888" value="0x0C08A000" />
+        <register type="NOA" address="0x00009888" value="0x0E095000" />
+        <register type="NOA" address="0x00009888" value="0x14090005" />
+        <register type="NOA" address="0x00009888" value="0x020D8000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x060E4000" />
+        <register type="NOA" address="0x00009888" value="0x080E5000" />
+        <register type="NOA" address="0x00009888" value="0x0A0E1000" />
+        <register type="NOA" address="0x00009888" value="0x1812A800" />
+        <register type="NOA" address="0x00009888" value="0x1A12003E" />
+        <register type="NOA" address="0x00009888" value="0x0212C000" />
+        <register type="NOA" address="0x00009888" value="0x0412C000" />
+        <register type="NOA" address="0x00009888" value="0x0813C000" />
+        <register type="NOA" address="0x00009888" value="0x0A13F000" />
+        <register type="NOA" address="0x00009888" value="0x04136000" />
+        <register type="NOA" address="0x00009888" value="0x0A14C000" />
+        <register type="NOA" address="0x00009888" value="0x0C14C000" />
+        <register type="NOA" address="0x00009888" value="0x0E14C000" />
+        <register type="NOA" address="0x00009888" value="0x00148000" />
+        <register type="NOA" address="0x00009888" value="0x02144000" />
+        <register type="NOA" address="0x00009888" value="0x0015C000" />
+        <register type="NOA" address="0x00009888" value="0x0E15C000" />
+        <register type="NOA" address="0x00009888" value="0x16152AF8" />
+        <register type="NOA" address="0x00009888" value="0x18150005" />
+        <register type="NOA" address="0x00009888" value="0x02154000" />
+        <register type="NOA" address="0x00009888" value="0x04154000" />
+        <register type="NOA" address="0x00009888" value="0x06158000" />
+        <register type="NOA" address="0x00009888" value="0x08158000" />
+        <register type="NOA" address="0x00009888" value="0x0A158000" />
+        <register type="NOA" address="0x00009888" value="0x0C158000" />
+        <register type="NOA" address="0x00009888" value="0x00182000" />
+        <register type="NOA" address="0x00009888" value="0x06188000" />
+        <register type="NOA" address="0x00009888" value="0x0818A000" />
+        <register type="NOA" address="0x00009888" value="0x08192000" />
+        <register type="NOA" address="0x00009888" value="0x0E198000" />
+        <register type="NOA" address="0x00009888" value="0x12190140" />
+        <register type="NOA" address="0x00009888" value="0x0E1CA000" />
+        <register type="NOA" address="0x00009888" value="0x001C8000" />
+        <register type="NOA" address="0x00009888" value="0x021C2000" />
+        <register type="NOA" address="0x00009888" value="0x141D0028" />
+        <register type="NOA" address="0x00009888" value="0x081D8000" />
+        <register type="NOA" address="0x00009888" value="0x0A1D2000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x301F8000" />
+        <register type="NOA" address="0x00009888" value="0x501F4924" />
+        <register type="NOA" address="0x00009888" value="0x521F4924" />
+        <register type="NOA" address="0x00009888" value="0x541F0024" />
+        <register type="NOA" address="0x00009888" value="0x3A1F8000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2420" />
+        <register type="NOA" address="0x00009888" value="0x3E1F5000" />
+        <register type="NOA" address="0x00009888" value="0x461F3050" />
+        <register type="NOA" address="0x00009888" value="0x481F2030" />
+        <register type="NOA" address="0x00009888" value="0x4A1F0020" />
+        <register type="NOA" address="0x00009888" value="0x4C1F2000" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F0000" />
+        <register type="NOA" address="0x00009888" value="0x421F5050" />
+        <register type="NOA" address="0x00009888" value="0x441F3030" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="40dc79f2-88c8-47c6-8f86-f509e39fbe5d"
+       chipset="ICL"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Posh Ring Busy"
+             description="The percentage of time when posh command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="posh_engine_busy"
+             units="percent"
+             symbol_name="PoshEngineBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox1 Ring Busy"
+             description="The percentage of time when Vdbox1 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox1_busy"
+             units="percent"
+             symbol_name="Vdbox1Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x0E061200" />
+        <register type="NOA" address="0x00009888" value="0x22062400" />
+        <register type="NOA" address="0x00009888" value="0x10002400" />
+        <register type="NOA" address="0x00009888" value="0x00038000" />
+        <register type="NOA" address="0x00009888" value="0x06032000" />
+        <register type="NOA" address="0x00009888" value="0x020600F3" />
+        <register type="NOA" address="0x00009888" value="0x0C060043" />
+        <register type="NOA" address="0x00009888" value="0x20060000" />
+        <register type="NOA" address="0x00009888" value="0x02000023" />
+        <register type="NOA" address="0x00009888" value="0x20002000" />
+        <register type="NOA" address="0x00009888" value="0x081A8000" />
+        <register type="NOA" address="0x00009888" value="0x3A1F6000" />
+        <register type="NOA" address="0x00009888" value="0x4E1F2900" />
+        <register type="NOA" address="0x00009888" value="0x501F00E9" />
+        <register type="NOA" address="0x00009888" value="0x10204000" />
+        <register type="NOA" address="0x00009888" value="0x0C214000" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x401F4131" />
+        <register type="NOA" address="0x00009888" value="0x421F1021" />
+        <register type="NOA" address="0x00009888" value="0x441F3100" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+        <register type="NOA" address="0x00009884" value="0x00000002" />
+        <register type="NOA" address="0x00009888" value="0x181B2400" />
+        <register type="NOA" address="0x00009888" value="0x185B2400" />
+        <register type="NOA" address="0x00009888" value="0x12240120" />
+        <register type="NOA" address="0x00009888" value="0x06218000" />
+        <register type="NOA" address="0x00009888" value="0x08212000" />
+        <register type="NOA" address="0x00009888" value="0x0A0A8000" />
+        <register type="NOA" address="0x00009888" value="0x180B8000" />
+        <register type="NOA" address="0x00009888" value="0x0A0C8000" />
+        <register type="NOA" address="0x00009888" value="0x040F8000" />
+        <register type="NOA" address="0x00009888" value="0x0E080010" />
+        <register type="NOA" address="0x00009888" value="0x041B8300" />
+        <register type="NOA" address="0x00009888" value="0x101B0000" />
+        <register type="NOA" address="0x00009888" value="0x221B0000" />
+        <register type="NOA" address="0x00009888" value="0x041E4000" />
+        <register type="NOA" address="0x00009888" value="0x084A8000" />
+        <register type="NOA" address="0x00009888" value="0x184B4000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x044F2000" />
+        <register type="NOA" address="0x00009888" value="0x0E480004" />
+        <register type="NOA" address="0x00009888" value="0x045B0083" />
+        <register type="NOA" address="0x00009888" value="0x105B0000" />
+        <register type="NOA" address="0x00009888" value="0x225B0000" />
+        <register type="NOA" address="0x00009888" value="0x045E1000" />
+        <register type="NOA" address="0x00009888" value="0x0823A000" />
+        <register type="NOA" address="0x00009888" value="0x02242980" />
+        <register type="NOA" address="0x00009888" value="0x10240000" />
+        <register type="NOA" address="0x00009888" value="0x06240000" />
+        <register type="NOA" address="0x00009888" value="0x0A244000" />
+        <register type="NOA" address="0x00009888" value="0x1C250004" />
+        <register type="NOA" address="0x00009888" value="0x08268000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0007C000" />
+        <register type="OA" address="0x00002774" value="0x000007FF" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TestOa"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="3c0bf614-5d67-4326-887f-a24eb8a58244"
+       chipset="ICL"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.6666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.3333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.3333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.16666"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00000D04" value="0x00000200" />
+        <register type="NOA" address="0x00009840" value="0x00000000" />
+        <register type="NOA" address="0x00009884" value="0x00000003" />
+        <register type="NOA" address="0x00009888" value="0x16130000" />
+        <register type="NOA" address="0x00009888" value="0x24000001" />
+        <register type="NOA" address="0x00009888" value="0x0E130056" />
+        <register type="NOA" address="0x00009888" value="0x10130000" />
+        <register type="NOA" address="0x00009888" value="0x1A130000" />
+        <register type="NOA" address="0x00009888" value="0x541F0001" />
+        <register type="NOA" address="0x00009888" value="0x181F0000" />
+        <register type="NOA" address="0x00009888" value="0x4C1F0000" />
+        <register type="NOA" address="0x00009888" value="0x301F0000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x0000FFFF" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFF" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x0000FFFF" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-kblgt2.xml b/lib/i915/perf-configs/oa-kblgt2.xml
new file mode 100644
index 00000000..90db48bc
--- /dev/null
+++ b/lib/i915/perf-configs/oa-kblgt2.xml
@@ -0,0 +1,10866 @@
+<?xml version="1.0"?>
+<metrics version="1562317148" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="99c1a40e-a090-4354-86e3-4d068bb1917e"
+       chipset="KBLGT2"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C01E0" />
+        <register type="NOA" address="0x00009888" value="0x12170280" />
+        <register type="NOA" address="0x00009888" value="0x12370280" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0080" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A1B4000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0001" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x042F1000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8400" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F6600" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C2200" />
+        <register type="NOA" address="0x00009888" value="0x062D8000" />
+        <register type="NOA" address="0x00009888" value="0x082D8000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x08133000" />
+        <register type="NOA" address="0x00009888" value="0x00170020" />
+        <register type="NOA" address="0x00009888" value="0x08170021" />
+        <register type="NOA" address="0x00009888" value="0x10170000" />
+        <register type="NOA" address="0x00009888" value="0x0633C000" />
+        <register type="NOA" address="0x00009888" value="0x0833C000" />
+        <register type="NOA" address="0x00009888" value="0x06370800" />
+        <register type="NOA" address="0x00009888" value="0x08370840" />
+        <register type="NOA" address="0x00009888" value="0x10370000" />
+        <register type="NOA" address="0x00009888" value="0x0D933031" />
+        <register type="NOA" address="0x00009888" value="0x0F933E3F" />
+        <register type="NOA" address="0x00009888" value="0x01933D00" />
+        <register type="NOA" address="0x00009888" value="0x0393073C" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1D930000" />
+        <register type="NOA" address="0x00009888" value="0x19930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190001F" />
+        <register type="NOA" address="0x00009888" value="0x51904400" />
+        <register type="NOA" address="0x00009888" value="0x41900020" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C21" />
+        <register type="NOA" address="0x00009888" value="0x47900061" />
+        <register type="NOA" address="0x00009888" value="0x57904440" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900004" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="e17fc42a-e614-41b6-90c4-1074841a6c77"
+       chipset="KBLGT2"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0820" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x064F0900" />
+        <register type="NOA" address="0x00009888" value="0x084F0032" />
+        <register type="NOA" address="0x00009888" value="0x0A4F1891" />
+        <register type="NOA" address="0x00009888" value="0x0C4F0E00" />
+        <register type="NOA" address="0x00009888" value="0x0E4F003C" />
+        <register type="NOA" address="0x00009888" value="0x004F0D80" />
+        <register type="NOA" address="0x00009888" value="0x024F003B" />
+        <register type="NOA" address="0x00009888" value="0x006C0002" />
+        <register type="NOA" address="0x00009888" value="0x086C0100" />
+        <register type="NOA" address="0x00009888" value="0x0C6C000C" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B00" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x081B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E1B8000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0024" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C6000" />
+        <register type="NOA" address="0x00009888" value="0x1C5C001B" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0208" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+        <register type="NOA" address="0x00009888" value="0x162CFB00" />
+        <register type="NOA" address="0x00009888" value="0x182C00BE" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x19900157" />
+        <register type="NOA" address="0x00009888" value="0x1B900158" />
+        <register type="NOA" address="0x00009888" value="0x1D900105" />
+        <register type="NOA" address="0x00009888" value="0x1F900103" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x11900FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900821" />
+        <register type="NOA" address="0x00009888" value="0x47900802" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900802" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900002" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900422" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="d7a17a3a-ca71-40d2-a919-ace80d50633f"
+       chipset="KBLGT2"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull stall pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x10116800" />
+        <register type="NOA" address="0x00009888" value="0x178A03E0" />
+        <register type="NOA" address="0x00009888" value="0x11824C00" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x13840020" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x01870C40" />
+        <register type="NOA" address="0x00009888" value="0x17880000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x040D4000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020E5400" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x080F0040" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06110012" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890100" />
+        <register type="NOA" address="0x00009888" value="0x03898000" />
+        <register type="NOA" address="0x00009888" value="0x09808000" />
+        <register type="NOA" address="0x00009888" value="0x0B808000" />
+        <register type="NOA" address="0x00009888" value="0x0380C000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+        <register type="NOA" address="0x00009888" value="0x138A8000" />
+        <register type="NOA" address="0x00009888" value="0x1D81A000" />
+        <register type="NOA" address="0x00009888" value="0x15818000" />
+        <register type="NOA" address="0x00009888" value="0x17818000" />
+        <register type="NOA" address="0x00009888" value="0x0B820030" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x05824000" />
+        <register type="NOA" address="0x00009888" value="0x0D830003" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x03838000" />
+        <register type="NOA" address="0x00009888" value="0x07838000" />
+        <register type="NOA" address="0x00009888" value="0x0B840980" />
+        <register type="NOA" address="0x00009888" value="0x03844D80" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x09850080" />
+        <register type="NOA" address="0x00009888" value="0x03850003" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x09870032" />
+        <register type="NOA" address="0x00009888" value="0x01888052" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x09884000" />
+        <register type="NOA" address="0x00009888" value="0x1B931001" />
+        <register type="NOA" address="0x00009888" value="0x1D930001" />
+        <register type="NOA" address="0x00009888" value="0x19934000" />
+        <register type="NOA" address="0x00009888" value="0x1B958000" />
+        <register type="NOA" address="0x00009888" value="0x1D950094" />
+        <register type="NOA" address="0x00009888" value="0x19958000" />
+        <register type="NOA" address="0x00009888" value="0x09E58000" />
+        <register type="NOA" address="0x00009888" value="0x0BE58000" />
+        <register type="NOA" address="0x00009888" value="0x03E5C000" />
+        <register type="NOA" address="0x00009888" value="0x0592C000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D924000" />
+        <register type="NOA" address="0x00009888" value="0x0F924000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x1392C000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x01985000" />
+        <register type="NOA" address="0x00009888" value="0x07988000" />
+        <register type="NOA" address="0x00009888" value="0x09981000" />
+        <register type="NOA" address="0x00009888" value="0x0B982000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x0F989000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1190C080" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900440" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900C21" />
+        <register type="NOA" address="0x00009888" value="0x57900400" />
+        <register type="NOA" address="0x00009888" value="0x49900042" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900024" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900841" />
+        <register type="NOA" address="0x00009888" value="0x53900400" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="57b59202-172b-477a-87de-33f85572c589"
+       chipset="KBLGT2"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900064" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900150" />
+        <register type="NOA" address="0x00009888" value="0x21900151" />
+        <register type="NOA" address="0x00009888" value="0x23900152" />
+        <register type="NOA" address="0x00009888" value="0x25900153" />
+        <register type="NOA" address="0x00009888" value="0x27900154" />
+        <register type="NOA" address="0x00009888" value="0x29900155" />
+        <register type="NOA" address="0x00009888" value="0x2B900156" />
+        <register type="NOA" address="0x00009888" value="0x2D900157" />
+        <register type="NOA" address="0x00009888" value="0x2F90015F" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="3addf8ef-8e9b-40f5-a448-3dbb5d5128b0"
+       chipset="KBLGT2"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900160" />
+        <register type="NOA" address="0x00009888" value="0x21900161" />
+        <register type="NOA" address="0x00009888" value="0x23900162" />
+        <register type="NOA" address="0x00009888" value="0x25900163" />
+        <register type="NOA" address="0x00009888" value="0x27900164" />
+        <register type="NOA" address="0x00009888" value="0x29900165" />
+        <register type="NOA" address="0x00009888" value="0x2B900166" />
+        <register type="NOA" address="0x00009888" value="0x2D900167" />
+        <register type="NOA" address="0x00009888" value="0x2F900150" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="4af0400a-81c3-47db-a6b6-deddbd75680e"
+       chipset="KBLGT2"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C8160" />
+        <register type="NOA" address="0x00009888" value="0x161C8015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4EAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B01" />
+        <register type="NOA" address="0x00009888" value="0x006C0200" />
+        <register type="NOA" address="0x00009888" value="0x026C000C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0041" />
+        <register type="NOA" address="0x00009888" value="0x061C4200" />
+        <register type="NOA" address="0x00009888" value="0x081C4443" />
+        <register type="NOA" address="0x00009888" value="0x0A1C4645" />
+        <register type="NOA" address="0x00009888" value="0x0C1C7647" />
+        <register type="NOA" address="0x00009888" value="0x041C7357" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0000" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4CAA2A" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02AA" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5515" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x11907FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900802" />
+        <register type="NOA" address="0x00009888" value="0x47900842" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900842" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900800" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="0e22f995-79ca-4f67-83ab-e9d9772488d8"
+       chipset="KBLGT2"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages send to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C0760" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E8020" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1CE000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2A00" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0280" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F1500" />
+        <register type="NOA" address="0x00009888" value="0x100F0140" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C00A0" />
+        <register type="NOA" address="0x00009888" value="0x03933300" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190030F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900021" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="fb149d66-fad2-4230-b0d7-4d689b9116d3"
+       chipset="KBLGT2"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x106C0232" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F1880" />
+        <register type="NOA" address="0x00009888" value="0x024F08BB" />
+        <register type="NOA" address="0x00009888" value="0x044F001B" />
+        <register type="NOA" address="0x00009888" value="0x046C0100" />
+        <register type="NOA" address="0x00009888" value="0x066C000B" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x041B8000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025BC000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x165C8000" />
+        <register type="NOA" address="0x00009888" value="0x185C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00A0" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x062CC000" />
+        <register type="NOA" address="0x00009888" value="0x082CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x07830000" />
+        <register type="NOA" address="0x00009888" value="0x1D950080" />
+        <register type="NOA" address="0x00009888" value="0x13928000" />
+        <register type="NOA" address="0x00009888" value="0x0F988000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900040" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="f889f8cc-4c93-4ac8-b75f-551c0b9b87f7"
+       chipset="KBLGT2"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C7B40" />
+        <register type="NOA" address="0x00009888" value="0x166C0020" />
+        <register type="NOA" address="0x00009888" value="0x0A603444" />
+        <register type="NOA" address="0x00009888" value="0x0A613400" />
+        <register type="NOA" address="0x00009888" value="0x1A4EA800" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0800" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C003C" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x10600000" />
+        <register type="NOA" address="0x00009888" value="0x04600000" />
+        <register type="NOA" address="0x00009888" value="0x0C610044" />
+        <register type="NOA" address="0x00009888" value="0x10610000" />
+        <register type="NOA" address="0x00009888" value="0x06610000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02A8" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0154" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190FFC0" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900021" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900400" />
+        <register type="NOA" address="0x00009888" value="0x43900421" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="6d344efd-8e9e-42d4-a29e-1011c29f82c2"
+       chipset="KBLGT2"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C02E0" />
+        <register type="NOA" address="0x00009888" value="0x146C0001" />
+        <register type="NOA" address="0x00009888" value="0x0A623400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x026C3324" />
+        <register type="NOA" address="0x00009888" value="0x046C3422" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x06614000" />
+        <register type="NOA" address="0x00009888" value="0x0C620044" />
+        <register type="NOA" address="0x00009888" value="0x10620000" />
+        <register type="NOA" address="0x00009888" value="0x06620000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="e3b386ae-c195-47d5-af29-8a1afa0ae2bf"
+       chipset="KBLGT2"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C4E80" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A633400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x026C3321" />
+        <register type="NOA" address="0x00009888" value="0x046C342F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C2000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x06604000" />
+        <register type="NOA" address="0x00009888" value="0x0C630044" />
+        <register type="NOA" address="0x00009888" value="0x10630000" />
+        <register type="NOA" address="0x00009888" value="0x06630000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00AA" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="f9954679-a055-4862-9f57-9d66e3ebf81c"
+       chipset="KBLGT2"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x102F3800" />
+        <register type="NOA" address="0x00009888" value="0x144D0500" />
+        <register type="NOA" address="0x00009888" value="0x120D03C0" />
+        <register type="NOA" address="0x00009888" value="0x140D03CF" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0004" />
+        <register type="NOA" address="0x00009888" value="0x0C4E4000" />
+        <register type="NOA" address="0x00009888" value="0x042F0480" />
+        <register type="NOA" address="0x00009888" value="0x082F0000" />
+        <register type="NOA" address="0x00009888" value="0x022F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0090" />
+        <register type="NOA" address="0x00009888" value="0x064D0027" />
+        <register type="NOA" address="0x00009888" value="0x004D0000" />
+        <register type="NOA" address="0x00009888" value="0x000D0D40" />
+        <register type="NOA" address="0x00009888" value="0x020D803F" />
+        <register type="NOA" address="0x00009888" value="0x040D8023" />
+        <register type="NOA" address="0x00009888" value="0x100D0000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020F0010" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0050" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41901400" />
+        <register type="NOA" address="0x00009888" value="0x43901485" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="4ed5e27e-fd1a-4f11-ad8f-9374e128c697"
+       chipset="KBLGT2"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x14152C00" />
+        <register type="NOA" address="0x00009888" value="0x16150005" />
+        <register type="NOA" address="0x00009888" value="0x121600A0" />
+        <register type="NOA" address="0x00009888" value="0x14352C00" />
+        <register type="NOA" address="0x00009888" value="0x16350005" />
+        <register type="NOA" address="0x00009888" value="0x123600A0" />
+        <register type="NOA" address="0x00009888" value="0x14552C00" />
+        <register type="NOA" address="0x00009888" value="0x16550005" />
+        <register type="NOA" address="0x00009888" value="0x125600A0" />
+        <register type="NOA" address="0x00009888" value="0x062F6000" />
+        <register type="NOA" address="0x00009888" value="0x022F2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0050" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0350" />
+        <register type="NOA" address="0x00009888" value="0x0C0FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F00DA" />
+        <register type="NOA" address="0x00009888" value="0x182C0028" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x022DC000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C138000" />
+        <register type="NOA" address="0x00009888" value="0x0E132000" />
+        <register type="NOA" address="0x00009888" value="0x0413C000" />
+        <register type="NOA" address="0x00009888" value="0x1C140018" />
+        <register type="NOA" address="0x00009888" value="0x0C157000" />
+        <register type="NOA" address="0x00009888" value="0x0E150078" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04162180" />
+        <register type="NOA" address="0x00009888" value="0x02160000" />
+        <register type="NOA" address="0x00009888" value="0x04174000" />
+        <register type="NOA" address="0x00009888" value="0x0233A000" />
+        <register type="NOA" address="0x00009888" value="0x04333000" />
+        <register type="NOA" address="0x00009888" value="0x14348000" />
+        <register type="NOA" address="0x00009888" value="0x16348000" />
+        <register type="NOA" address="0x00009888" value="0x02357870" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04360043" />
+        <register type="NOA" address="0x00009888" value="0x02360000" />
+        <register type="NOA" address="0x00009888" value="0x04371000" />
+        <register type="NOA" address="0x00009888" value="0x0E538000" />
+        <register type="NOA" address="0x00009888" value="0x00538000" />
+        <register type="NOA" address="0x00009888" value="0x06533000" />
+        <register type="NOA" address="0x00009888" value="0x1C540020" />
+        <register type="NOA" address="0x00009888" value="0x12548000" />
+        <register type="NOA" address="0x00009888" value="0x0E557000" />
+        <register type="NOA" address="0x00009888" value="0x00557800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06560043" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x06571000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900060" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900060" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="9eaf384d-8f53-41b8-a71d-108308780fbc"
+       chipset="KBLGT2"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12120000" />
+        <register type="NOA" address="0x00009888" value="0x12320000" />
+        <register type="NOA" address="0x00009888" value="0x12520000" />
+        <register type="NOA" address="0x00009888" value="0x002F8000" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0015" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F03A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0FF000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0095" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x02108000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x02118000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x02121880" />
+        <register type="NOA" address="0x00009888" value="0x041219B5" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x02134000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x0C308000" />
+        <register type="NOA" address="0x00009888" value="0x0E304000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x0C318000" />
+        <register type="NOA" address="0x00009888" value="0x0E314000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x0C321A80" />
+        <register type="NOA" address="0x00009888" value="0x0E320033" />
+        <register type="NOA" address="0x00009888" value="0x06320031" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x0C334000" />
+        <register type="NOA" address="0x00009888" value="0x0E331000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0E508000" />
+        <register type="NOA" address="0x00009888" value="0x00508000" />
+        <register type="NOA" address="0x00009888" value="0x02504000" />
+        <register type="NOA" address="0x00009888" value="0x0E518000" />
+        <register type="NOA" address="0x00009888" value="0x00518000" />
+        <register type="NOA" address="0x00009888" value="0x02514000" />
+        <register type="NOA" address="0x00009888" value="0x0E521880" />
+        <register type="NOA" address="0x00009888" value="0x00521A80" />
+        <register type="NOA" address="0x00009888" value="0x02520033" />
+        <register type="NOA" address="0x00009888" value="0x0E534000" />
+        <register type="NOA" address="0x00009888" value="0x00534000" />
+        <register type="NOA" address="0x00009888" value="0x02531000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900062" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="a00cbdf2-eabd-4240-9a89-86e2ac1ca1e4"
+       chipset="KBLGT2"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12124D60" />
+        <register type="NOA" address="0x00009888" value="0x12322E60" />
+        <register type="NOA" address="0x00009888" value="0x12524D60" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0014" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0FE000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0097" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x002D8000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x04121FB7" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x00308000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x00318000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x00321B80" />
+        <register type="NOA" address="0x00009888" value="0x0632003F" />
+        <register type="NOA" address="0x00009888" value="0x00334000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0250C000" />
+        <register type="NOA" address="0x00009888" value="0x0251C000" />
+        <register type="NOA" address="0x00009888" value="0x02521FB7" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x02535000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900063" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="aa7a3fb9-22fb-43ff-a32d-0ab6c13bbd16"
+       chipset="KBLGT2"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 7 READ C 6 READ FADD C 5 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121203E0" />
+        <register type="NOA" address="0x00009888" value="0x123203E0" />
+        <register type="NOA" address="0x00009888" value="0x125203E0" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F006C" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x042D8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06114000" />
+        <register type="NOA" address="0x00009888" value="0x06120033" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x04308000" />
+        <register type="NOA" address="0x00009888" value="0x04318000" />
+        <register type="NOA" address="0x00009888" value="0x04321980" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x04334000" />
+        <register type="NOA" address="0x00009888" value="0x04504000" />
+        <register type="NOA" address="0x00009888" value="0x04514000" />
+        <register type="NOA" address="0x00009888" value="0x04520033" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x04531000" />
+        <register type="NOA" address="0x00009888" value="0x1190E000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C00" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00001000" />
+        <register type="FLEX" address="0x0000E558" value="0x00003002" />
+        <register type="FLEX" address="0x0000E658" value="0x00005004" />
+        <register type="FLEX" address="0x0000E758" value="0x00011010" />
+        <register type="FLEX" address="0x0000E45C" value="0x00050012" />
+        <register type="FLEX" address="0x0000E55C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E65C" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="Media Vme Pipe Gen9"
+       mdapi_supported_apis="MEDIA IO BB"
+       underscore_name="vme_pipe"
+       hw_config_guid="398a4268-ef6f-4ffc-b55f-3c7b5363ce61"
+       chipset="KBLGT2"
+       symbol_name="VMEPipe"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VME Busy"
+             description="The percentage of time in which VME (IME or CRE) was actively processing data."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vme_busy"
+             units="percent"
+             symbol_name="VMEBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview System Batch Tier2"
+             mdapi_group="VME Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A5800" />
+        <register type="NOA" address="0x00009888" value="0x161A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12180240" />
+        <register type="NOA" address="0x00009888" value="0x14180002" />
+        <register type="NOA" address="0x00009888" value="0x143A5800" />
+        <register type="NOA" address="0x00009888" value="0x163A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12380240" />
+        <register type="NOA" address="0x00009888" value="0x14380002" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x022F8000" />
+        <register type="NOA" address="0x00009888" value="0x042F3000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C1500" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F9500" />
+        <register type="NOA" address="0x00009888" value="0x100F002A" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x0A2DC000" />
+        <register type="NOA" address="0x00009888" value="0x0C2DC000" />
+        <register type="NOA" address="0x00009888" value="0x04193000" />
+        <register type="NOA" address="0x00009888" value="0x081A28C1" />
+        <register type="NOA" address="0x00009888" value="0x001A0000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x0613C000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x00172000" />
+        <register type="NOA" address="0x00009888" value="0x06178000" />
+        <register type="NOA" address="0x00009888" value="0x0817A000" />
+        <register type="NOA" address="0x00009888" value="0x00180037" />
+        <register type="NOA" address="0x00009888" value="0x06180940" />
+        <register type="NOA" address="0x00009888" value="0x08180000" />
+        <register type="NOA" address="0x00009888" value="0x02180000" />
+        <register type="NOA" address="0x00009888" value="0x04183000" />
+        <register type="NOA" address="0x00009888" value="0x06393000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A28C1" />
+        <register type="NOA" address="0x00009888" value="0x003A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A33F000" />
+        <register type="NOA" address="0x00009888" value="0x0C33F000" />
+        <register type="NOA" address="0x00009888" value="0x0A37A000" />
+        <register type="NOA" address="0x00009888" value="0x0C37A000" />
+        <register type="NOA" address="0x00009888" value="0x0A380977" />
+        <register type="NOA" address="0x00009888" value="0x08380000" />
+        <register type="NOA" address="0x00009888" value="0x04380000" />
+        <register type="NOA" address="0x00009888" value="0x06383000" />
+        <register type="NOA" address="0x00009888" value="0x119000FF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900800" />
+        <register type="NOA" address="0x00009888" value="0x47901000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900844" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00100030" />
+        <register type="OA" address="0x00002774" value="0x0000FFF9" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFF3" />
+        <register type="OA" address="0x00002788" value="0x00100180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="6c66fe6e-2988-454a-bfae-7fca3bbcbec2"
+       chipset="KBLGT2"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x13805800" />
+        <register type="NOA" address="0x00009888" value="0x05962C00" />
+        <register type="NOA" address="0x00009888" value="0x19950016" />
+        <register type="NOA" address="0x00009888" value="0x19C05800" />
+        <register type="NOA" address="0x00009888" value="0x07800035" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x1D810400" />
+        <register type="NOA" address="0x00009888" value="0x07960025" />
+        <register type="NOA" address="0x00009888" value="0x21960000" />
+        <register type="NOA" address="0x00009888" value="0x0B964000" />
+        <register type="NOA" address="0x00009888" value="0x1B930062" />
+        <register type="NOA" address="0x00009888" value="0x17948000" />
+        <register type="NOA" address="0x00009888" value="0x1B940008" />
+        <register type="NOA" address="0x00009888" value="0x05950075" />
+        <register type="NOA" address="0x00009888" value="0x1D950000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x09978000" />
+        <register type="NOA" address="0x00009888" value="0x05C08500" />
+        <register type="NOA" address="0x00009888" value="0x25C00000" />
+        <register type="NOA" address="0x00009888" value="0x1BC00000" />
+        <register type="NOA" address="0x00009888" value="0x0BC54000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C60" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00078000" />
+        <register type="OA" address="0x00002774" value="0x00000FFF" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9.5"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="baa3c7e4-52b6-4b85-801e-465a94b746dd"
+       chipset="KBLGT2"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810000" />
+        <register type="NOA" address="0x00009888" value="0x07810013" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930040" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="b49aa434-4958-4d98-9e6f-443ff27ca74d"
+       chipset="KBLGT2"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x122D3080" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E0FAA00" />
+        <register type="NOA" address="0x00009888" value="0x100F0002" />
+        <register type="NOA" address="0x00009888" value="0x002D0025" />
+        <register type="NOA" address="0x00009888" value="0x062D1300" />
+        <register type="NOA" address="0x00009888" value="0x082D16A4" />
+        <register type="NOA" address="0x00009888" value="0x0A2D162E" />
+        <register type="NOA" address="0x00009888" value="0x102D0000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-kblgt3.xml b/lib/i915/perf-configs/oa-kblgt3.xml
new file mode 100644
index 00000000..9a26caac
--- /dev/null
+++ b/lib/i915/perf-configs/oa-kblgt3.xml
@@ -0,0 +1,10933 @@
+<?xml version="1.0"?>
+<metrics version="1562317148" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="17b4f3e0-d578-4ae3-b7a8-98d756d1e0df"
+       chipset="KBLGT3"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ B 5 READ UADD 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C01E0" />
+        <register type="NOA" address="0x00009888" value="0x12170280" />
+        <register type="NOA" address="0x00009888" value="0x12370280" />
+        <register type="NOA" address="0x00009888" value="0x16EC01E0" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0380" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A1B4000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0001" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x042F1000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8400" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0002" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F6600" />
+        <register type="NOA" address="0x00009888" value="0x100F0001" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CA200" />
+        <register type="NOA" address="0x00009888" value="0x062D8000" />
+        <register type="NOA" address="0x00009888" value="0x082D8000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x08133000" />
+        <register type="NOA" address="0x00009888" value="0x00170020" />
+        <register type="NOA" address="0x00009888" value="0x08170021" />
+        <register type="NOA" address="0x00009888" value="0x10170000" />
+        <register type="NOA" address="0x00009888" value="0x0633C000" />
+        <register type="NOA" address="0x00009888" value="0x0833C000" />
+        <register type="NOA" address="0x00009888" value="0x06370800" />
+        <register type="NOA" address="0x00009888" value="0x08370840" />
+        <register type="NOA" address="0x00009888" value="0x10370000" />
+        <register type="NOA" address="0x00009888" value="0x1ACE0200" />
+        <register type="NOA" address="0x00009888" value="0x0AEC5300" />
+        <register type="NOA" address="0x00009888" value="0x10EC0000" />
+        <register type="NOA" address="0x00009888" value="0x1CEC0000" />
+        <register type="NOA" address="0x00009888" value="0x0A9B8000" />
+        <register type="NOA" address="0x00009888" value="0x1C9C0002" />
+        <register type="NOA" address="0x00009888" value="0x0CCC0002" />
+        <register type="NOA" address="0x00009888" value="0x0A8D8000" />
+        <register type="NOA" address="0x00009888" value="0x108F0001" />
+        <register type="NOA" address="0x00009888" value="0x16AC8000" />
+        <register type="NOA" address="0x00009888" value="0x0D933031" />
+        <register type="NOA" address="0x00009888" value="0x0F933E3F" />
+        <register type="NOA" address="0x00009888" value="0x01933D00" />
+        <register type="NOA" address="0x00009888" value="0x0393073C" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1D930000" />
+        <register type="NOA" address="0x00009888" value="0x19930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51902240" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x55900242" />
+        <register type="NOA" address="0x00009888" value="0x45900084" />
+        <register type="NOA" address="0x00009888" value="0x47901400" />
+        <register type="NOA" address="0x00009888" value="0x57902220" />
+        <register type="NOA" address="0x00009888" value="0x49900C60" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900002" />
+        <register type="NOA" address="0x00009888" value="0x43900C63" />
+        <register type="NOA" address="0x00009888" value="0x53902222" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="9823aaa1-b06f-40ce-884b-cd798c79f0c2"
+       chipset="KBLGT3"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0820" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x064F0900" />
+        <register type="NOA" address="0x00009888" value="0x084F0032" />
+        <register type="NOA" address="0x00009888" value="0x0A4F1891" />
+        <register type="NOA" address="0x00009888" value="0x0C4F0E00" />
+        <register type="NOA" address="0x00009888" value="0x0E4F003C" />
+        <register type="NOA" address="0x00009888" value="0x004F0D80" />
+        <register type="NOA" address="0x00009888" value="0x024F003B" />
+        <register type="NOA" address="0x00009888" value="0x006C0002" />
+        <register type="NOA" address="0x00009888" value="0x086C0100" />
+        <register type="NOA" address="0x00009888" value="0x0C6C000C" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B00" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x081B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E1B8000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0024" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C6000" />
+        <register type="NOA" address="0x00009888" value="0x1C5C001B" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0208" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+        <register type="NOA" address="0x00009888" value="0x162CFB00" />
+        <register type="NOA" address="0x00009888" value="0x182C00BE" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x19900157" />
+        <register type="NOA" address="0x00009888" value="0x1B900158" />
+        <register type="NOA" address="0x00009888" value="0x1D900105" />
+        <register type="NOA" address="0x00009888" value="0x1F900103" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x11900FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900821" />
+        <register type="NOA" address="0x00009888" value="0x47900802" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900802" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900002" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900422" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="c7c735f3-ce58-45cf-aa04-30b183f1faff"
+       chipset="KBLGT3"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull stall pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x10116800" />
+        <register type="NOA" address="0x00009888" value="0x178A03E0" />
+        <register type="NOA" address="0x00009888" value="0x11824C00" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x13840020" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x01870C40" />
+        <register type="NOA" address="0x00009888" value="0x17880000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x040D4000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020E5400" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x080F0040" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06110012" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890100" />
+        <register type="NOA" address="0x00009888" value="0x03898000" />
+        <register type="NOA" address="0x00009888" value="0x09808000" />
+        <register type="NOA" address="0x00009888" value="0x0B808000" />
+        <register type="NOA" address="0x00009888" value="0x0380C000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+        <register type="NOA" address="0x00009888" value="0x138A8000" />
+        <register type="NOA" address="0x00009888" value="0x1D81A000" />
+        <register type="NOA" address="0x00009888" value="0x15818000" />
+        <register type="NOA" address="0x00009888" value="0x17818000" />
+        <register type="NOA" address="0x00009888" value="0x0B820030" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x05824000" />
+        <register type="NOA" address="0x00009888" value="0x0D830003" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x03838000" />
+        <register type="NOA" address="0x00009888" value="0x07838000" />
+        <register type="NOA" address="0x00009888" value="0x0B840980" />
+        <register type="NOA" address="0x00009888" value="0x03844D80" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x09850080" />
+        <register type="NOA" address="0x00009888" value="0x03850003" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x09870032" />
+        <register type="NOA" address="0x00009888" value="0x01888052" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x09884000" />
+        <register type="NOA" address="0x00009888" value="0x1B931001" />
+        <register type="NOA" address="0x00009888" value="0x1D930001" />
+        <register type="NOA" address="0x00009888" value="0x19934000" />
+        <register type="NOA" address="0x00009888" value="0x1B958000" />
+        <register type="NOA" address="0x00009888" value="0x1D950094" />
+        <register type="NOA" address="0x00009888" value="0x19958000" />
+        <register type="NOA" address="0x00009888" value="0x09E58000" />
+        <register type="NOA" address="0x00009888" value="0x0BE58000" />
+        <register type="NOA" address="0x00009888" value="0x03E5C000" />
+        <register type="NOA" address="0x00009888" value="0x0592C000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D924000" />
+        <register type="NOA" address="0x00009888" value="0x0F924000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x1392C000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x01985000" />
+        <register type="NOA" address="0x00009888" value="0x07988000" />
+        <register type="NOA" address="0x00009888" value="0x09981000" />
+        <register type="NOA" address="0x00009888" value="0x0B982000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x0F989000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1190C080" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900440" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900C21" />
+        <register type="NOA" address="0x00009888" value="0x57900400" />
+        <register type="NOA" address="0x00009888" value="0x49900042" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900024" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900841" />
+        <register type="NOA" address="0x00009888" value="0x53900400" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="96ec2219-040b-428a-856a-6bc03363a057"
+       chipset="KBLGT3"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900064" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900150" />
+        <register type="NOA" address="0x00009888" value="0x21900151" />
+        <register type="NOA" address="0x00009888" value="0x23900152" />
+        <register type="NOA" address="0x00009888" value="0x25900153" />
+        <register type="NOA" address="0x00009888" value="0x27900154" />
+        <register type="NOA" address="0x00009888" value="0x29900155" />
+        <register type="NOA" address="0x00009888" value="0x2B900156" />
+        <register type="NOA" address="0x00009888" value="0x2D900157" />
+        <register type="NOA" address="0x00009888" value="0x2F90015F" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="03372b64-4996-4d3b-aa18-790e75eeb9c2"
+       chipset="KBLGT3"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900160" />
+        <register type="NOA" address="0x00009888" value="0x21900161" />
+        <register type="NOA" address="0x00009888" value="0x23900162" />
+        <register type="NOA" address="0x00009888" value="0x25900163" />
+        <register type="NOA" address="0x00009888" value="0x27900164" />
+        <register type="NOA" address="0x00009888" value="0x29900165" />
+        <register type="NOA" address="0x00009888" value="0x2B900166" />
+        <register type="NOA" address="0x00009888" value="0x2D900167" />
+        <register type="NOA" address="0x00009888" value="0x2F900150" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="31b4ce5a-bd61-4c1f-bb5d-f2e731412150"
+       chipset="KBLGT3"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C8160" />
+        <register type="NOA" address="0x00009888" value="0x161C8015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4EAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B01" />
+        <register type="NOA" address="0x00009888" value="0x006C0200" />
+        <register type="NOA" address="0x00009888" value="0x026C000C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0041" />
+        <register type="NOA" address="0x00009888" value="0x061C4200" />
+        <register type="NOA" address="0x00009888" value="0x081C4443" />
+        <register type="NOA" address="0x00009888" value="0x0A1C4645" />
+        <register type="NOA" address="0x00009888" value="0x0C1C7647" />
+        <register type="NOA" address="0x00009888" value="0x041C7357" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0000" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4CAA2A" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02AA" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5515" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x11907FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900802" />
+        <register type="NOA" address="0x00009888" value="0x47900842" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900842" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900800" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="2ce0911a-27fc-4887-96f0-11084fa807c3"
+       chipset="KBLGT3"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages send to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C0760" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E8020" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1CE000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2A00" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0280" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F1500" />
+        <register type="NOA" address="0x00009888" value="0x100F0140" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C00A0" />
+        <register type="NOA" address="0x00009888" value="0x03933300" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190030F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900021" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="b128f45f-bfa2-4991-aadc-05be7898e398"
+       chipset="KBLGT3"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x106C0232" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F1880" />
+        <register type="NOA" address="0x00009888" value="0x024F08BB" />
+        <register type="NOA" address="0x00009888" value="0x044F001B" />
+        <register type="NOA" address="0x00009888" value="0x046C0100" />
+        <register type="NOA" address="0x00009888" value="0x066C000B" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x041B8000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025BC000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x165C8000" />
+        <register type="NOA" address="0x00009888" value="0x185C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00A0" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x062CC000" />
+        <register type="NOA" address="0x00009888" value="0x082CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x07830000" />
+        <register type="NOA" address="0x00009888" value="0x1D950080" />
+        <register type="NOA" address="0x00009888" value="0x13928000" />
+        <register type="NOA" address="0x00009888" value="0x0F988000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900040" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="f3566b55-9c13-47bf-8327-4a887af75262"
+       chipset="KBLGT3"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C7B40" />
+        <register type="NOA" address="0x00009888" value="0x166C0020" />
+        <register type="NOA" address="0x00009888" value="0x0A603444" />
+        <register type="NOA" address="0x00009888" value="0x0A613400" />
+        <register type="NOA" address="0x00009888" value="0x1A4EA800" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0800" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C003C" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x10600000" />
+        <register type="NOA" address="0x00009888" value="0x04600000" />
+        <register type="NOA" address="0x00009888" value="0x0C610044" />
+        <register type="NOA" address="0x00009888" value="0x10610000" />
+        <register type="NOA" address="0x00009888" value="0x06610000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02A8" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0154" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190FFC0" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900021" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900400" />
+        <register type="NOA" address="0x00009888" value="0x43900421" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="7b21aa68-9076-4ab4-8a84-e45a06c8eac6"
+       chipset="KBLGT3"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C02E0" />
+        <register type="NOA" address="0x00009888" value="0x146C0001" />
+        <register type="NOA" address="0x00009888" value="0x0A623400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x026C3324" />
+        <register type="NOA" address="0x00009888" value="0x046C3422" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x06614000" />
+        <register type="NOA" address="0x00009888" value="0x0C620044" />
+        <register type="NOA" address="0x00009888" value="0x10620000" />
+        <register type="NOA" address="0x00009888" value="0x06620000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="71b4b9dd-ae28-48ce-9a1a-5431e1f23afd"
+       chipset="KBLGT3"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C4E80" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A633400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x026C3321" />
+        <register type="NOA" address="0x00009888" value="0x046C342F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C2000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x06604000" />
+        <register type="NOA" address="0x00009888" value="0x0C630044" />
+        <register type="NOA" address="0x00009888" value="0x10630000" />
+        <register type="NOA" address="0x00009888" value="0x06630000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00AA" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="52c646ca-52da-4853-877e-8645e73ed330"
+       chipset="KBLGT3"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x102F3800" />
+        <register type="NOA" address="0x00009888" value="0x144D0500" />
+        <register type="NOA" address="0x00009888" value="0x120D03C0" />
+        <register type="NOA" address="0x00009888" value="0x140D03CF" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0004" />
+        <register type="NOA" address="0x00009888" value="0x0C4E4000" />
+        <register type="NOA" address="0x00009888" value="0x042F0480" />
+        <register type="NOA" address="0x00009888" value="0x082F0000" />
+        <register type="NOA" address="0x00009888" value="0x022F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0090" />
+        <register type="NOA" address="0x00009888" value="0x064D0027" />
+        <register type="NOA" address="0x00009888" value="0x004D0000" />
+        <register type="NOA" address="0x00009888" value="0x000D0D40" />
+        <register type="NOA" address="0x00009888" value="0x020D803F" />
+        <register type="NOA" address="0x00009888" value="0x040D8023" />
+        <register type="NOA" address="0x00009888" value="0x100D0000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020F0010" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0050" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41901400" />
+        <register type="NOA" address="0x00009888" value="0x43901485" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="c4bb682f-677c-4875-990b-005230be87b4"
+       chipset="KBLGT3"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x14152C00" />
+        <register type="NOA" address="0x00009888" value="0x16150005" />
+        <register type="NOA" address="0x00009888" value="0x121600A0" />
+        <register type="NOA" address="0x00009888" value="0x14352C00" />
+        <register type="NOA" address="0x00009888" value="0x16350005" />
+        <register type="NOA" address="0x00009888" value="0x123600A0" />
+        <register type="NOA" address="0x00009888" value="0x14552C00" />
+        <register type="NOA" address="0x00009888" value="0x16550005" />
+        <register type="NOA" address="0x00009888" value="0x125600A0" />
+        <register type="NOA" address="0x00009888" value="0x062F6000" />
+        <register type="NOA" address="0x00009888" value="0x022F2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0050" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0350" />
+        <register type="NOA" address="0x00009888" value="0x0C0FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F00DA" />
+        <register type="NOA" address="0x00009888" value="0x182C0028" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x022DC000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C138000" />
+        <register type="NOA" address="0x00009888" value="0x0E132000" />
+        <register type="NOA" address="0x00009888" value="0x0413C000" />
+        <register type="NOA" address="0x00009888" value="0x1C140018" />
+        <register type="NOA" address="0x00009888" value="0x0C157000" />
+        <register type="NOA" address="0x00009888" value="0x0E150078" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04162180" />
+        <register type="NOA" address="0x00009888" value="0x02160000" />
+        <register type="NOA" address="0x00009888" value="0x04174000" />
+        <register type="NOA" address="0x00009888" value="0x0233A000" />
+        <register type="NOA" address="0x00009888" value="0x04333000" />
+        <register type="NOA" address="0x00009888" value="0x14348000" />
+        <register type="NOA" address="0x00009888" value="0x16348000" />
+        <register type="NOA" address="0x00009888" value="0x02357870" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04360043" />
+        <register type="NOA" address="0x00009888" value="0x02360000" />
+        <register type="NOA" address="0x00009888" value="0x04371000" />
+        <register type="NOA" address="0x00009888" value="0x0E538000" />
+        <register type="NOA" address="0x00009888" value="0x00538000" />
+        <register type="NOA" address="0x00009888" value="0x06533000" />
+        <register type="NOA" address="0x00009888" value="0x1C540020" />
+        <register type="NOA" address="0x00009888" value="0x12548000" />
+        <register type="NOA" address="0x00009888" value="0x0E557000" />
+        <register type="NOA" address="0x00009888" value="0x00557800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06560043" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x06571000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900060" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900060" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="ade8521b-5e72-45d4-8c25-d9f0da774899"
+       chipset="KBLGT3"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12120000" />
+        <register type="NOA" address="0x00009888" value="0x12320000" />
+        <register type="NOA" address="0x00009888" value="0x12520000" />
+        <register type="NOA" address="0x00009888" value="0x002F8000" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0015" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F03A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0FF000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0095" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x02108000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x02118000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x02121880" />
+        <register type="NOA" address="0x00009888" value="0x041219B5" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x02134000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x0C308000" />
+        <register type="NOA" address="0x00009888" value="0x0E304000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x0C318000" />
+        <register type="NOA" address="0x00009888" value="0x0E314000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x0C321A80" />
+        <register type="NOA" address="0x00009888" value="0x0E320033" />
+        <register type="NOA" address="0x00009888" value="0x06320031" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x0C334000" />
+        <register type="NOA" address="0x00009888" value="0x0E331000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0E508000" />
+        <register type="NOA" address="0x00009888" value="0x00508000" />
+        <register type="NOA" address="0x00009888" value="0x02504000" />
+        <register type="NOA" address="0x00009888" value="0x0E518000" />
+        <register type="NOA" address="0x00009888" value="0x00518000" />
+        <register type="NOA" address="0x00009888" value="0x02514000" />
+        <register type="NOA" address="0x00009888" value="0x0E521880" />
+        <register type="NOA" address="0x00009888" value="0x00521A80" />
+        <register type="NOA" address="0x00009888" value="0x02520033" />
+        <register type="NOA" address="0x00009888" value="0x0E534000" />
+        <register type="NOA" address="0x00009888" value="0x00534000" />
+        <register type="NOA" address="0x00009888" value="0x02531000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900062" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="9df2815d-4e9e-417f-bde1-3788dc6e1ea1"
+       chipset="KBLGT3"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12124D60" />
+        <register type="NOA" address="0x00009888" value="0x12322E60" />
+        <register type="NOA" address="0x00009888" value="0x12524D60" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0014" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0FE000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0097" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x002D8000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x04121FB7" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x00308000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x00318000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x00321B80" />
+        <register type="NOA" address="0x00009888" value="0x0632003F" />
+        <register type="NOA" address="0x00009888" value="0x00334000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0250C000" />
+        <register type="NOA" address="0x00009888" value="0x0251C000" />
+        <register type="NOA" address="0x00009888" value="0x02521FB7" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x02535000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900063" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="efc497ac-884e-4ee4-a4a8-15fba22aaf21"
+       chipset="KBLGT3"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 5 READ C 6 READ FADD C 7 READ FADD C 2 READ FADD C 3 READ FADD C 4 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121203E0" />
+        <register type="NOA" address="0x00009888" value="0x123203E0" />
+        <register type="NOA" address="0x00009888" value="0x125203E0" />
+        <register type="NOA" address="0x00009888" value="0x129203E0" />
+        <register type="NOA" address="0x00009888" value="0x12B203E0" />
+        <register type="NOA" address="0x00009888" value="0x12D203E0" />
+        <register type="NOA" address="0x00009888" value="0x024EC000" />
+        <register type="NOA" address="0x00009888" value="0x044EC000" />
+        <register type="NOA" address="0x00009888" value="0x064EC000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0042" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F006D" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x042D8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06114000" />
+        <register type="NOA" address="0x00009888" value="0x06120033" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x04308000" />
+        <register type="NOA" address="0x00009888" value="0x04318000" />
+        <register type="NOA" address="0x00009888" value="0x04321980" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x04334000" />
+        <register type="NOA" address="0x00009888" value="0x04504000" />
+        <register type="NOA" address="0x00009888" value="0x04514000" />
+        <register type="NOA" address="0x00009888" value="0x04520033" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x04531000" />
+        <register type="NOA" address="0x00009888" value="0x00AF8000" />
+        <register type="NOA" address="0x00009888" value="0x0ACC0001" />
+        <register type="NOA" address="0x00009888" value="0x008D8000" />
+        <register type="NOA" address="0x00009888" value="0x028DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C8FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F0001" />
+        <register type="NOA" address="0x00009888" value="0x06AC8000" />
+        <register type="NOA" address="0x00009888" value="0x02AD4000" />
+        <register type="NOA" address="0x00009888" value="0x02908000" />
+        <register type="NOA" address="0x00009888" value="0x02918000" />
+        <register type="NOA" address="0x00009888" value="0x02921980" />
+        <register type="NOA" address="0x00009888" value="0x00920000" />
+        <register type="NOA" address="0x00009888" value="0x02934000" />
+        <register type="NOA" address="0x00009888" value="0x02B04000" />
+        <register type="NOA" address="0x00009888" value="0x02B14000" />
+        <register type="NOA" address="0x00009888" value="0x02B20033" />
+        <register type="NOA" address="0x00009888" value="0x00B20000" />
+        <register type="NOA" address="0x00009888" value="0x02B31000" />
+        <register type="NOA" address="0x00009888" value="0x00D08000" />
+        <register type="NOA" address="0x00009888" value="0x00D18000" />
+        <register type="NOA" address="0x00009888" value="0x00D21980" />
+        <register type="NOA" address="0x00009888" value="0x00D34000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900002" />
+        <register type="NOA" address="0x00009888" value="0x53900420" />
+        <register type="NOA" address="0x00009888" value="0x459000A1" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+  </set>
+
+  <set name="Media Vme Pipe Gen9"
+       mdapi_supported_apis="MEDIA IO BB"
+       underscore_name="vme_pipe"
+       hw_config_guid="bfd9764d-2c5b-4c16-bfc1-89de3ca10917"
+       chipset="KBLGT3"
+       symbol_name="VMEPipe"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VME Busy"
+             description="The percentage of time in which VME (IME or CRE) was actively processing data."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vme_busy"
+             units="percent"
+             symbol_name="VMEBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview System Batch Tier2"
+             mdapi_group="VME Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A5800" />
+        <register type="NOA" address="0x00009888" value="0x161A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12180240" />
+        <register type="NOA" address="0x00009888" value="0x14180002" />
+        <register type="NOA" address="0x00009888" value="0x149A5800" />
+        <register type="NOA" address="0x00009888" value="0x169A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12980240" />
+        <register type="NOA" address="0x00009888" value="0x14980002" />
+        <register type="NOA" address="0x00009888" value="0x1A4E3FC0" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x022F8000" />
+        <register type="NOA" address="0x00009888" value="0x042F3000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C9500" />
+        <register type="NOA" address="0x00009888" value="0x0C4C002A" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0015" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C000A" />
+        <register type="NOA" address="0x00009888" value="0x04193000" />
+        <register type="NOA" address="0x00009888" value="0x081A28C1" />
+        <register type="NOA" address="0x00009888" value="0x001A0000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x0613C000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x00172000" />
+        <register type="NOA" address="0x00009888" value="0x06178000" />
+        <register type="NOA" address="0x00009888" value="0x0817A000" />
+        <register type="NOA" address="0x00009888" value="0x00180037" />
+        <register type="NOA" address="0x00009888" value="0x06180940" />
+        <register type="NOA" address="0x00009888" value="0x08180000" />
+        <register type="NOA" address="0x00009888" value="0x02180000" />
+        <register type="NOA" address="0x00009888" value="0x04183000" />
+        <register type="NOA" address="0x00009888" value="0x04AFC000" />
+        <register type="NOA" address="0x00009888" value="0x06AF3000" />
+        <register type="NOA" address="0x00009888" value="0x0ACC4000" />
+        <register type="NOA" address="0x00009888" value="0x0CCC0015" />
+        <register type="NOA" address="0x00009888" value="0x0A8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F4000" />
+        <register type="NOA" address="0x00009888" value="0x108F0015" />
+        <register type="NOA" address="0x00009888" value="0x16ACA000" />
+        <register type="NOA" address="0x00009888" value="0x18AC000A" />
+        <register type="NOA" address="0x00009888" value="0x06993000" />
+        <register type="NOA" address="0x00009888" value="0x0C9A28C1" />
+        <register type="NOA" address="0x00009888" value="0x009A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A93F000" />
+        <register type="NOA" address="0x00009888" value="0x0C93F000" />
+        <register type="NOA" address="0x00009888" value="0x0A97A000" />
+        <register type="NOA" address="0x00009888" value="0x0C97A000" />
+        <register type="NOA" address="0x00009888" value="0x0A980977" />
+        <register type="NOA" address="0x00009888" value="0x08980000" />
+        <register type="NOA" address="0x00009888" value="0x04980000" />
+        <register type="NOA" address="0x00009888" value="0x06983000" />
+        <register type="NOA" address="0x00009888" value="0x119000FF" />
+        <register type="NOA" address="0x00009888" value="0x51900040" />
+        <register type="NOA" address="0x00009888" value="0x41900020" />
+        <register type="NOA" address="0x00009888" value="0x55900004" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x479008A5" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900002" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00100030" />
+        <register type="OA" address="0x00002774" value="0x0000FFF9" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFF3" />
+        <register type="OA" address="0x00002788" value="0x00100180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="b55ecba1-2aa9-422e-89ff-b9e30f03d447"
+       chipset="KBLGT3"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox1 Ring Busy"
+             description="The percentage of time when Vdbox1 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox1_busy"
+             units="percent"
+             symbol_name="Vdbox1Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x19D05800" />
+        <register type="NOA" address="0x00009888" value="0x13805800" />
+        <register type="NOA" address="0x00009888" value="0x05962C25" />
+        <register type="NOA" address="0x00009888" value="0x19950016" />
+        <register type="NOA" address="0x00009888" value="0x19C05800" />
+        <register type="NOA" address="0x00009888" value="0x05D00085" />
+        <register type="NOA" address="0x00009888" value="0x25D00000" />
+        <register type="NOA" address="0x00009888" value="0x09D54000" />
+        <register type="NOA" address="0x00009888" value="0x07800035" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x1D810400" />
+        <register type="NOA" address="0x00009888" value="0x21960000" />
+        <register type="NOA" address="0x00009888" value="0x0996C000" />
+        <register type="NOA" address="0x00009888" value="0x0B964000" />
+        <register type="NOA" address="0x00009888" value="0x19938000" />
+        <register type="NOA" address="0x00009888" value="0x1B930068" />
+        <register type="NOA" address="0x00009888" value="0x15948000" />
+        <register type="NOA" address="0x00009888" value="0x1B94000C" />
+        <register type="NOA" address="0x00009888" value="0x03957500" />
+        <register type="NOA" address="0x00009888" value="0x1D950000" />
+        <register type="NOA" address="0x00009888" value="0x17950000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x07928000" />
+        <register type="NOA" address="0x00009888" value="0x03988000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x09978000" />
+        <register type="NOA" address="0x00009888" value="0x05C08500" />
+        <register type="NOA" address="0x00009888" value="0x25C00000" />
+        <register type="NOA" address="0x00009888" value="0x1BC00000" />
+        <register type="NOA" address="0x00009888" value="0x0BC54000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900463" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0007C000" />
+        <register type="OA" address="0x00002774" value="0x000007FF" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="f1792f32-6db2-4b50-b4b2-557128f1688d"
+       chipset="KBLGT3"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810000" />
+        <register type="NOA" address="0x00009888" value="0x07810013" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930040" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="85bc2e4f-2563-4388-921b-dc0dad879cf3"
+       chipset="KBLGT3"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x122D3080" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E0FAA00" />
+        <register type="NOA" address="0x00009888" value="0x100F0002" />
+        <register type="NOA" address="0x00009888" value="0x002D0025" />
+        <register type="NOA" address="0x00009888" value="0x062D1300" />
+        <register type="NOA" address="0x00009888" value="0x082D16A4" />
+        <register type="NOA" address="0x00009888" value="0x0A2D162E" />
+        <register type="NOA" address="0x00009888" value="0x102D0000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-sklgt2.xml b/lib/i915/perf-configs/oa-sklgt2.xml
new file mode 100644
index 00000000..ba8d2b4c
--- /dev/null
+++ b/lib/i915/perf-configs/oa-sklgt2.xml
@@ -0,0 +1,11895 @@
+<?xml version="1.0"?>
+<metrics version="1562317147" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="07b25942-d9fd-4fce-bd58-e29abd66b7de"
+       chipset="SKLGT2"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x02 UGTE"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C01E0" />
+        <register type="NOA" address="0x00009888" value="0x12170280" />
+        <register type="NOA" address="0x00009888" value="0x12370280" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0080" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A1B4000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0001" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x042F1000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8400" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F6600" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C2200" />
+        <register type="NOA" address="0x00009888" value="0x062D8000" />
+        <register type="NOA" address="0x00009888" value="0x082D8000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x08133000" />
+        <register type="NOA" address="0x00009888" value="0x00170020" />
+        <register type="NOA" address="0x00009888" value="0x08170021" />
+        <register type="NOA" address="0x00009888" value="0x10170000" />
+        <register type="NOA" address="0x00009888" value="0x0633C000" />
+        <register type="NOA" address="0x00009888" value="0x0833C000" />
+        <register type="NOA" address="0x00009888" value="0x06370800" />
+        <register type="NOA" address="0x00009888" value="0x08370840" />
+        <register type="NOA" address="0x00009888" value="0x10370000" />
+        <register type="NOA" address="0x00009888" value="0x0D933031" />
+        <register type="NOA" address="0x00009888" value="0x0F933E3F" />
+        <register type="NOA" address="0x00009888" value="0x01933D00" />
+        <register type="NOA" address="0x00009888" value="0x0393073C" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1D930000" />
+        <register type="NOA" address="0x00009888" value="0x19930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190001F" />
+        <register type="NOA" address="0x00009888" value="0x51904400" />
+        <register type="NOA" address="0x00009888" value="0x41900020" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C21" />
+        <register type="NOA" address="0x00009888" value="0x47900061" />
+        <register type="NOA" address="0x00009888" value="0x57904440" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900004" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53904444" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="00b80b4c-d215-4378-9015-da3dda3b61ea"
+       chipset="SKLGT2"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA"
+                     availability="$SliceMask 0x01 AND $SkuRevisionId 0x02 ULT &&"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901403" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E8200" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F0DB2" />
+        <register type="NOA" address="0x00009888" value="0x064F0900" />
+        <register type="NOA" address="0x00009888" value="0x084F1880" />
+        <register type="NOA" address="0x00009888" value="0x0A4F0011" />
+        <register type="NOA" address="0x00009888" value="0x0C4F0E3C" />
+        <register type="NOA" address="0x00009888" value="0x0E4F1D80" />
+        <register type="NOA" address="0x00009888" value="0x086C0002" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0100" />
+        <register type="NOA" address="0x00009888" value="0x0E6C000C" />
+        <register type="NOA" address="0x00009888" value="0x026C000B" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x081B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A1B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E1B4000" />
+        <register type="NOA" address="0x00009888" value="0x021B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C4000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0012" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x005BC000" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B8000" />
+        <register type="NOA" address="0x00009888" value="0x0A5B4000" />
+        <register type="NOA" address="0x00009888" value="0x0C5BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B8000" />
+        <register type="NOA" address="0x00009888" value="0x105C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A5CA000" />
+        <register type="NOA" address="0x00009888" value="0x1C5C002D" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0800" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0082" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002CC000" />
+        <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+        <register type="NOA" address="0x00009888" value="0x162CBE00" />
+        <register type="NOA" address="0x00009888" value="0x182C00EF" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x19900157" />
+        <register type="NOA" address="0x00009888" value="0x1B900167" />
+        <register type="NOA" address="0x00009888" value="0x1D900105" />
+        <register type="NOA" address="0x00009888" value="0x1F900103" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x11900FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900840" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900842" />
+        <register type="NOA" address="0x00009888" value="0x47900840" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900840" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900040" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900840" />
+        <register type="NOA" address="0x00009888" value="0x53901111" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SliceMask 0x01 AND $SkuRevisionId 0x02 UGTE &&"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901403" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0820" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x064F0900" />
+        <register type="NOA" address="0x00009888" value="0x084F0032" />
+        <register type="NOA" address="0x00009888" value="0x0A4F1810" />
+        <register type="NOA" address="0x00009888" value="0x0C4F0E00" />
+        <register type="NOA" address="0x00009888" value="0x0E4F003C" />
+        <register type="NOA" address="0x00009888" value="0x004F0D80" />
+        <register type="NOA" address="0x00009888" value="0x024F003B" />
+        <register type="NOA" address="0x00009888" value="0x006C0002" />
+        <register type="NOA" address="0x00009888" value="0x086C0000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C000C" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B00" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x081B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E1B8000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0024" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C6000" />
+        <register type="NOA" address="0x00009888" value="0x1C5C001B" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0208" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+        <register type="NOA" address="0x00009888" value="0x162CFB00" />
+        <register type="NOA" address="0x00009888" value="0x182C00BE" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x19900157" />
+        <register type="NOA" address="0x00009888" value="0x1B900167" />
+        <register type="NOA" address="0x00009888" value="0x1D900105" />
+        <register type="NOA" address="0x00009888" value="0x1F900103" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x11900FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900842" />
+        <register type="NOA" address="0x00009888" value="0x47900802" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900802" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900002" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53901111" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="2a0c0933-37e7-427c-9951-ded42a78bb27"
+       chipset="SKLGT2"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull stall pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x02 ULT"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x10116800" />
+        <register type="NOA" address="0x00009888" value="0x178A03E0" />
+        <register type="NOA" address="0x00009888" value="0x11824C00" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x13840020" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x01870C40" />
+        <register type="NOA" address="0x00009888" value="0x17880000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x040D4000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020E5400" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x080F0040" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06110012" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890100" />
+        <register type="NOA" address="0x00009888" value="0x03898000" />
+        <register type="NOA" address="0x00009888" value="0x09808000" />
+        <register type="NOA" address="0x00009888" value="0x0B808000" />
+        <register type="NOA" address="0x00009888" value="0x0380C000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+        <register type="NOA" address="0x00009888" value="0x138A8000" />
+        <register type="NOA" address="0x00009888" value="0x1D81A000" />
+        <register type="NOA" address="0x00009888" value="0x15818000" />
+        <register type="NOA" address="0x00009888" value="0x17818000" />
+        <register type="NOA" address="0x00009888" value="0x0B820030" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x05824000" />
+        <register type="NOA" address="0x00009888" value="0x0D830003" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x03838000" />
+        <register type="NOA" address="0x00009888" value="0x07838000" />
+        <register type="NOA" address="0x00009888" value="0x0B840980" />
+        <register type="NOA" address="0x00009888" value="0x03844D80" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x09850080" />
+        <register type="NOA" address="0x00009888" value="0x03850003" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x09870032" />
+        <register type="NOA" address="0x00009888" value="0x01888052" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x09884000" />
+        <register type="NOA" address="0x00009888" value="0x15968000" />
+        <register type="NOA" address="0x00009888" value="0x17968000" />
+        <register type="NOA" address="0x00009888" value="0x0F96C000" />
+        <register type="NOA" address="0x00009888" value="0x1F950011" />
+        <register type="NOA" address="0x00009888" value="0x1D950014" />
+        <register type="NOA" address="0x00009888" value="0x0592C000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D924000" />
+        <register type="NOA" address="0x00009888" value="0x0F924000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x1392C000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x01985000" />
+        <register type="NOA" address="0x00009888" value="0x07988000" />
+        <register type="NOA" address="0x00009888" value="0x09981000" />
+        <register type="NOA" address="0x00009888" value="0x0B982000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x0F989000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x0B978000" />
+        <register type="NOA" address="0x00009888" value="0x0F974000" />
+        <register type="NOA" address="0x00009888" value="0x11974000" />
+        <register type="NOA" address="0x00009888" value="0x13978000" />
+        <register type="NOA" address="0x00009888" value="0x09974000" />
+        <register type="NOA" address="0x00009888" value="0x1190C080" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x419010A0" />
+        <register type="NOA" address="0x00009888" value="0x55904000" />
+        <register type="NOA" address="0x00009888" value="0x45901000" />
+        <register type="NOA" address="0x00009888" value="0x47900084" />
+        <register type="NOA" address="0x00009888" value="0x57904400" />
+        <register type="NOA" address="0x00009888" value="0x499000A5" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900081" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x439014A4" />
+        <register type="NOA" address="0x00009888" value="0x53900400" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x02 UGTE"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x10116800" />
+        <register type="NOA" address="0x00009888" value="0x178A03E0" />
+        <register type="NOA" address="0x00009888" value="0x11824C00" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x13840020" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x01870C40" />
+        <register type="NOA" address="0x00009888" value="0x17880000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x040D4000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020E5400" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x080F0040" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06110012" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890100" />
+        <register type="NOA" address="0x00009888" value="0x03898000" />
+        <register type="NOA" address="0x00009888" value="0x09808000" />
+        <register type="NOA" address="0x00009888" value="0x0B808000" />
+        <register type="NOA" address="0x00009888" value="0x0380C000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+        <register type="NOA" address="0x00009888" value="0x138A8000" />
+        <register type="NOA" address="0x00009888" value="0x1D81A000" />
+        <register type="NOA" address="0x00009888" value="0x15818000" />
+        <register type="NOA" address="0x00009888" value="0x17818000" />
+        <register type="NOA" address="0x00009888" value="0x0B820030" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x05824000" />
+        <register type="NOA" address="0x00009888" value="0x0D830003" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x03838000" />
+        <register type="NOA" address="0x00009888" value="0x07838000" />
+        <register type="NOA" address="0x00009888" value="0x0B840980" />
+        <register type="NOA" address="0x00009888" value="0x03844D80" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x09850080" />
+        <register type="NOA" address="0x00009888" value="0x03850003" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x09870032" />
+        <register type="NOA" address="0x00009888" value="0x01888052" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x09884000" />
+        <register type="NOA" address="0x00009888" value="0x1B931001" />
+        <register type="NOA" address="0x00009888" value="0x1D930001" />
+        <register type="NOA" address="0x00009888" value="0x19934000" />
+        <register type="NOA" address="0x00009888" value="0x1B958000" />
+        <register type="NOA" address="0x00009888" value="0x1D950094" />
+        <register type="NOA" address="0x00009888" value="0x19958000" />
+        <register type="NOA" address="0x00009888" value="0x05E5A000" />
+        <register type="NOA" address="0x00009888" value="0x01E5C000" />
+        <register type="NOA" address="0x00009888" value="0x0592C000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D924000" />
+        <register type="NOA" address="0x00009888" value="0x0F924000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x1392C000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x01985000" />
+        <register type="NOA" address="0x00009888" value="0x07988000" />
+        <register type="NOA" address="0x00009888" value="0x09981000" />
+        <register type="NOA" address="0x00009888" value="0x0B982000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x0F989000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1190C080" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x419010A0" />
+        <register type="NOA" address="0x00009888" value="0x55904000" />
+        <register type="NOA" address="0x00009888" value="0x45901000" />
+        <register type="NOA" address="0x00009888" value="0x47900084" />
+        <register type="NOA" address="0x00009888" value="0x57904400" />
+        <register type="NOA" address="0x00009888" value="0x499000A5" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900081" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x439014A4" />
+        <register type="NOA" address="0x00009888" value="0x53900400" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="246b35f1-44e0-4d03-8936-e452e291d064"
+       chipset="SKLGT2"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA"
+                     availability="$SliceMask 0x01 AND $SkuRevisionId 0x02 ULT &&"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x13946000" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x0F968000" />
+        <register type="NOA" address="0x00009888" value="0x1196C000" />
+        <register type="NOA" address="0x00009888" value="0x13964000" />
+        <register type="NOA" address="0x00009888" value="0x11938000" />
+        <register type="NOA" address="0x00009888" value="0x1B93FE00" />
+        <register type="NOA" address="0x00009888" value="0x01940010" />
+        <register type="NOA" address="0x00009888" value="0x07941100" />
+        <register type="NOA" address="0x00009888" value="0x09941312" />
+        <register type="NOA" address="0x00009888" value="0x0B941514" />
+        <register type="NOA" address="0x00009888" value="0x0D941716" />
+        <register type="NOA" address="0x00009888" value="0x11940000" />
+        <register type="NOA" address="0x00009888" value="0x19940000" />
+        <register type="NOA" address="0x00009888" value="0x1B940000" />
+        <register type="NOA" address="0x00009888" value="0x1D940000" />
+        <register type="NOA" address="0x00009888" value="0x1B954000" />
+        <register type="NOA" address="0x00009888" value="0x1D95A550" />
+        <register type="NOA" address="0x00009888" value="0x1F9502AA" />
+        <register type="NOA" address="0x00009888" value="0x2F900157" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13908000" />
+        <register type="NOA" address="0x00009888" value="0x21908000" />
+        <register type="NOA" address="0x00009888" value="0x23908000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27908000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x05 ULT $SkuRevisionId 0x02 UGTE &&"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x13946000" />
+        <register type="NOA" address="0x00009888" value="0x15940016" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x19930800" />
+        <register type="NOA" address="0x00009888" value="0x1B93AA55" />
+        <register type="NOA" address="0x00009888" value="0x1D9300AA" />
+        <register type="NOA" address="0x00009888" value="0x01940010" />
+        <register type="NOA" address="0x00009888" value="0x07941100" />
+        <register type="NOA" address="0x00009888" value="0x09941312" />
+        <register type="NOA" address="0x00009888" value="0x0B941514" />
+        <register type="NOA" address="0x00009888" value="0x0D941716" />
+        <register type="NOA" address="0x00009888" value="0x0F940018" />
+        <register type="NOA" address="0x00009888" value="0x1B940000" />
+        <register type="NOA" address="0x00009888" value="0x11940000" />
+        <register type="NOA" address="0x00009888" value="0x01E58000" />
+        <register type="NOA" address="0x00009888" value="0x03E57000" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13908000" />
+        <register type="NOA" address="0x00009888" value="0x21908000" />
+        <register type="NOA" address="0x00009888" value="0x23908000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27908000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C20" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900421" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900421" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900061" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x05 UGTE"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900064" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900150" />
+        <register type="NOA" address="0x00009888" value="0x21900151" />
+        <register type="NOA" address="0x00009888" value="0x23900152" />
+        <register type="NOA" address="0x00009888" value="0x25900153" />
+        <register type="NOA" address="0x00009888" value="0x27900154" />
+        <register type="NOA" address="0x00009888" value="0x29900155" />
+        <register type="NOA" address="0x00009888" value="0x2B900156" />
+        <register type="NOA" address="0x00009888" value="0x2D900157" />
+        <register type="NOA" address="0x00009888" value="0x2F90015F" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="e0d3da02-00bf-4a96-9795-b48158c73a68"
+       chipset="SKLGT2"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA"
+                     availability="$SliceMask 0x01 AND $SkuRevisionId 0x02 ULT &&"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x13945400" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901400" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x0F968000" />
+        <register type="NOA" address="0x00009888" value="0x1196C000" />
+        <register type="NOA" address="0x00009888" value="0x13964000" />
+        <register type="NOA" address="0x00009888" value="0x11938000" />
+        <register type="NOA" address="0x00009888" value="0x1B93FE00" />
+        <register type="NOA" address="0x00009888" value="0x01940010" />
+        <register type="NOA" address="0x00009888" value="0x07941100" />
+        <register type="NOA" address="0x00009888" value="0x09941312" />
+        <register type="NOA" address="0x00009888" value="0x0B941514" />
+        <register type="NOA" address="0x00009888" value="0x0D941716" />
+        <register type="NOA" address="0x00009888" value="0x11940000" />
+        <register type="NOA" address="0x00009888" value="0x19940000" />
+        <register type="NOA" address="0x00009888" value="0x1B940000" />
+        <register type="NOA" address="0x00009888" value="0x1D940000" />
+        <register type="NOA" address="0x00009888" value="0x1B954000" />
+        <register type="NOA" address="0x00009888" value="0x1D95A550" />
+        <register type="NOA" address="0x00009888" value="0x1F9502AA" />
+        <register type="NOA" address="0x00009888" value="0x2F900167" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13908000" />
+        <register type="NOA" address="0x00009888" value="0x21908000" />
+        <register type="NOA" address="0x00009888" value="0x23908000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27908000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900160" />
+        <register type="NOA" address="0x00009888" value="0x21900161" />
+        <register type="NOA" address="0x00009888" value="0x23900162" />
+        <register type="NOA" address="0x00009888" value="0x25900163" />
+        <register type="NOA" address="0x00009888" value="0x27900164" />
+        <register type="NOA" address="0x00009888" value="0x29900165" />
+        <register type="NOA" address="0x00009888" value="0x2B900166" />
+        <register type="NOA" address="0x00009888" value="0x2D900167" />
+        <register type="NOA" address="0x00009888" value="0x2F900150" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="NOA"
+                     availability="$SkuRevisionId 0x05 ULT $SkuRevisionId 0x02 UGTE &&"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x13945400" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901400" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x19930800" />
+        <register type="NOA" address="0x00009888" value="0x1B93AA55" />
+        <register type="NOA" address="0x00009888" value="0x1D93002A" />
+        <register type="NOA" address="0x00009888" value="0x01940010" />
+        <register type="NOA" address="0x00009888" value="0x07941100" />
+        <register type="NOA" address="0x00009888" value="0x09941312" />
+        <register type="NOA" address="0x00009888" value="0x0B941514" />
+        <register type="NOA" address="0x00009888" value="0x0D941716" />
+        <register type="NOA" address="0x00009888" value="0x1B940000" />
+        <register type="NOA" address="0x00009888" value="0x11940000" />
+        <register type="NOA" address="0x00009888" value="0x01E58000" />
+        <register type="NOA" address="0x00009888" value="0x03E57000" />
+        <register type="NOA" address="0x00009888" value="0x2F900167" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x13908000" />
+        <register type="NOA" address="0x00009888" value="0x21908000" />
+        <register type="NOA" address="0x00009888" value="0x23908000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27908000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C20" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900421" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900421" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900160" />
+        <register type="NOA" address="0x00009888" value="0x21900161" />
+        <register type="NOA" address="0x00009888" value="0x23900162" />
+        <register type="NOA" address="0x00009888" value="0x25900163" />
+        <register type="NOA" address="0x00009888" value="0x27900164" />
+        <register type="NOA" address="0x00009888" value="0x29900165" />
+        <register type="NOA" address="0x00009888" value="0x2B900166" />
+        <register type="NOA" address="0x00009888" value="0x2D900167" />
+        <register type="NOA" address="0x00009888" value="0x2F900150" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="c26b1fda-2752-4a33-a448-4c8718366846"
+       chipset="SKLGT2"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA"
+                     availability="$SubsliceMask 0x01 AND"
+                     priority="0"
+                     >
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C8160" />
+        <register type="NOA" address="0x00009888" value="0x161C8015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4EAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B01" />
+        <register type="NOA" address="0x00009888" value="0x006C0200" />
+        <register type="NOA" address="0x00009888" value="0x026C000C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0041" />
+        <register type="NOA" address="0x00009888" value="0x061C4200" />
+        <register type="NOA" address="0x00009888" value="0x081C4443" />
+        <register type="NOA" address="0x00009888" value="0x0A1C4645" />
+        <register type="NOA" address="0x00009888" value="0x0C1C7647" />
+        <register type="NOA" address="0x00009888" value="0x041C7357" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0000" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4CAA2A" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02AA" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5515" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x11907FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900802" />
+        <register type="NOA" address="0x00009888" value="0x47900842" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900842" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900800" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="9fb22842-e708-43f7-9752-e0e41670c39e"
+       chipset="SKLGT2"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages send to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x166C0760" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F901403" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E8020" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1CE000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2A00" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0280" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F1500" />
+        <register type="NOA" address="0x00009888" value="0x100F0140" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C00A0" />
+        <register type="NOA" address="0x00009888" value="0x03933300" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900167" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190030F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900042" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x53901111" />
+        <register type="NOA" address="0x00009888" value="0x43900420" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="b4aa5e13-2d25-418f-827d-421f5cc4c43b"
+       chipset="SKLGT2"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x106C0232" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F1880" />
+        <register type="NOA" address="0x00009888" value="0x024F08BB" />
+        <register type="NOA" address="0x00009888" value="0x044F001B" />
+        <register type="NOA" address="0x00009888" value="0x046C0100" />
+        <register type="NOA" address="0x00009888" value="0x066C000B" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x041B8000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025BC000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x165C8000" />
+        <register type="NOA" address="0x00009888" value="0x185C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00A0" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x062CC000" />
+        <register type="NOA" address="0x00009888" value="0x082CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x07830000" />
+        <register type="NOA" address="0x00009888" value="0x1D950080" />
+        <register type="NOA" address="0x00009888" value="0x13928000" />
+        <register type="NOA" address="0x00009888" value="0x0F988000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x4B9000A0" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="504000e8-64f2-4aac-8301-51b81aa60d45"
+       chipset="SKLGT2"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x126C7B40" />
+        <register type="NOA" address="0x00009888" value="0x166C0020" />
+        <register type="NOA" address="0x00009888" value="0x0A603444" />
+        <register type="NOA" address="0x00009888" value="0x0A613400" />
+        <register type="NOA" address="0x00009888" value="0x1A4EA800" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0800" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C003C" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x10600000" />
+        <register type="NOA" address="0x00009888" value="0x04600000" />
+        <register type="NOA" address="0x00009888" value="0x0C610044" />
+        <register type="NOA" address="0x00009888" value="0x10610000" />
+        <register type="NOA" address="0x00009888" value="0x06610000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02A8" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0154" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190FFC0" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900021" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900400" />
+        <register type="NOA" address="0x00009888" value="0x43900421" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="f542479b-6685-4670-ad8e-9fe282a2eb5b"
+       chipset="SKLGT2"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x126C02E0" />
+        <register type="NOA" address="0x00009888" value="0x146C0001" />
+        <register type="NOA" address="0x00009888" value="0x0A623400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x026C3324" />
+        <register type="NOA" address="0x00009888" value="0x046C3422" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x06614000" />
+        <register type="NOA" address="0x00009888" value="0x0C620044" />
+        <register type="NOA" address="0x00009888" value="0x10620000" />
+        <register type="NOA" address="0x00009888" value="0x06620000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="1cbf1e9f-c2de-4cc2-8d1c-2c33c25a2332"
+       chipset="SKLGT2"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x126C4E80" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A633400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x026C3321" />
+        <register type="NOA" address="0x00009888" value="0x046C342F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C2000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x06604000" />
+        <register type="NOA" address="0x00009888" value="0x0C630044" />
+        <register type="NOA" address="0x00009888" value="0x10630000" />
+        <register type="NOA" address="0x00009888" value="0x06630000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00AA" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="b4e54cc8-a3a0-4ccd-9990-65d3184e5a38"
+       chipset="SKLGT2"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x102F3800" />
+        <register type="NOA" address="0x00009888" value="0x144D0500" />
+        <register type="NOA" address="0x00009888" value="0x120D03C0" />
+        <register type="NOA" address="0x00009888" value="0x140D03CF" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0004" />
+        <register type="NOA" address="0x00009888" value="0x0C4E4000" />
+        <register type="NOA" address="0x00009888" value="0x042F0480" />
+        <register type="NOA" address="0x00009888" value="0x082F0000" />
+        <register type="NOA" address="0x00009888" value="0x022F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0090" />
+        <register type="NOA" address="0x00009888" value="0x064D0027" />
+        <register type="NOA" address="0x00009888" value="0x004D0000" />
+        <register type="NOA" address="0x00009888" value="0x000D0D40" />
+        <register type="NOA" address="0x00009888" value="0x020D803F" />
+        <register type="NOA" address="0x00009888" value="0x040D8023" />
+        <register type="NOA" address="0x00009888" value="0x100D0000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020F0010" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0050" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41901400" />
+        <register type="NOA" address="0x00009888" value="0x43901485" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="efe7eba4-fd9e-4a09-a92b-334970b5de57"
+       chipset="SKLGT2"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x14152C00" />
+        <register type="NOA" address="0x00009888" value="0x16150005" />
+        <register type="NOA" address="0x00009888" value="0x121600A0" />
+        <register type="NOA" address="0x00009888" value="0x14352C00" />
+        <register type="NOA" address="0x00009888" value="0x16350005" />
+        <register type="NOA" address="0x00009888" value="0x123600A0" />
+        <register type="NOA" address="0x00009888" value="0x14552C00" />
+        <register type="NOA" address="0x00009888" value="0x16550005" />
+        <register type="NOA" address="0x00009888" value="0x125600A0" />
+        <register type="NOA" address="0x00009888" value="0x062F6000" />
+        <register type="NOA" address="0x00009888" value="0x022F2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0050" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0350" />
+        <register type="NOA" address="0x00009888" value="0x0C0FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F00DA" />
+        <register type="NOA" address="0x00009888" value="0x182C0028" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x022DC000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C138000" />
+        <register type="NOA" address="0x00009888" value="0x0E132000" />
+        <register type="NOA" address="0x00009888" value="0x0413C000" />
+        <register type="NOA" address="0x00009888" value="0x1C140018" />
+        <register type="NOA" address="0x00009888" value="0x0C157000" />
+        <register type="NOA" address="0x00009888" value="0x0E150078" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04162180" />
+        <register type="NOA" address="0x00009888" value="0x02160000" />
+        <register type="NOA" address="0x00009888" value="0x04174000" />
+        <register type="NOA" address="0x00009888" value="0x0233A000" />
+        <register type="NOA" address="0x00009888" value="0x04333000" />
+        <register type="NOA" address="0x00009888" value="0x14348000" />
+        <register type="NOA" address="0x00009888" value="0x16348000" />
+        <register type="NOA" address="0x00009888" value="0x02357870" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04360043" />
+        <register type="NOA" address="0x00009888" value="0x02360000" />
+        <register type="NOA" address="0x00009888" value="0x04371000" />
+        <register type="NOA" address="0x00009888" value="0x0E538000" />
+        <register type="NOA" address="0x00009888" value="0x00538000" />
+        <register type="NOA" address="0x00009888" value="0x06533000" />
+        <register type="NOA" address="0x00009888" value="0x1C540020" />
+        <register type="NOA" address="0x00009888" value="0x12548000" />
+        <register type="NOA" address="0x00009888" value="0x0E557000" />
+        <register type="NOA" address="0x00009888" value="0x00557800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06560043" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x06571000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900060" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900060" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="e9bd0bbb-c7b7-4a26-a27a-246987354776"
+       chipset="SKLGT2"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x12120000" />
+        <register type="NOA" address="0x00009888" value="0x12320000" />
+        <register type="NOA" address="0x00009888" value="0x12520000" />
+        <register type="NOA" address="0x00009888" value="0x002F8000" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0015" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F03A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0FF000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0095" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x02108000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x02118000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x02121880" />
+        <register type="NOA" address="0x00009888" value="0x041219B5" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x02134000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x0C308000" />
+        <register type="NOA" address="0x00009888" value="0x0E304000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x0C318000" />
+        <register type="NOA" address="0x00009888" value="0x0E314000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x0C321A80" />
+        <register type="NOA" address="0x00009888" value="0x0E320033" />
+        <register type="NOA" address="0x00009888" value="0x06320031" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x0C334000" />
+        <register type="NOA" address="0x00009888" value="0x0E331000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0E508000" />
+        <register type="NOA" address="0x00009888" value="0x00508000" />
+        <register type="NOA" address="0x00009888" value="0x02504000" />
+        <register type="NOA" address="0x00009888" value="0x0E518000" />
+        <register type="NOA" address="0x00009888" value="0x00518000" />
+        <register type="NOA" address="0x00009888" value="0x02514000" />
+        <register type="NOA" address="0x00009888" value="0x0E521880" />
+        <register type="NOA" address="0x00009888" value="0x00521A80" />
+        <register type="NOA" address="0x00009888" value="0x02520033" />
+        <register type="NOA" address="0x00009888" value="0x0E534000" />
+        <register type="NOA" address="0x00009888" value="0x00534000" />
+        <register type="NOA" address="0x00009888" value="0x02531000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900062" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="0a7accbf-8c55-455f-9984-23e9fb0b826d"
+       chipset="SKLGT2"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x000000A0" />
+        <register type="NOA" address="0x00009888" value="0x12124D60" />
+        <register type="NOA" address="0x00009888" value="0x12322E60" />
+        <register type="NOA" address="0x00009888" value="0x12524D60" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0014" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0FE000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0097" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x002D8000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x04121FB7" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x00308000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x00318000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x00321B80" />
+        <register type="NOA" address="0x00009888" value="0x0632003F" />
+        <register type="NOA" address="0x00009888" value="0x00334000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0250C000" />
+        <register type="NOA" address="0x00009888" value="0x0251C000" />
+        <register type="NOA" address="0x00009888" value="0x02521FB7" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x02535000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900063" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="41a24047-7484-4ead-ae37-de907e5ff2b2"
+       chipset="SKLGT2"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 7 READ C 6 READ FADD C 5 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121203E0" />
+        <register type="NOA" address="0x00009888" value="0x123203E0" />
+        <register type="NOA" address="0x00009888" value="0x125203E0" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F006C" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x042D8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06114000" />
+        <register type="NOA" address="0x00009888" value="0x06120033" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x04308000" />
+        <register type="NOA" address="0x00009888" value="0x04318000" />
+        <register type="NOA" address="0x00009888" value="0x04321980" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x04334000" />
+        <register type="NOA" address="0x00009888" value="0x04504000" />
+        <register type="NOA" address="0x00009888" value="0x04514000" />
+        <register type="NOA" address="0x00009888" value="0x04520033" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x04531000" />
+        <register type="NOA" address="0x00009888" value="0x1190E000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C00" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00001000" />
+        <register type="FLEX" address="0x0000E558" value="0x00003002" />
+        <register type="FLEX" address="0x0000E658" value="0x00005004" />
+        <register type="FLEX" address="0x0000E758" value="0x00011010" />
+        <register type="FLEX" address="0x0000E45C" value="0x00050012" />
+        <register type="FLEX" address="0x0000E55C" value="0x00052051" />
+        <register type="FLEX" address="0x0000E65C" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="Media Vme Pipe Gen9"
+       mdapi_supported_apis="MEDIA IO BB"
+       underscore_name="vme_pipe"
+       hw_config_guid="95910492-943f-44bd-9461-390240f243fd"
+       chipset="SKLGT2"
+       symbol_name="VMEPipe"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VME Busy"
+             description="The percentage of time in which VME (IME or CRE) was actively processing data."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vme_busy"
+             units="percent"
+             symbol_name="VMEBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview System Batch Tier2"
+             mdapi_group="VME Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A5800" />
+        <register type="NOA" address="0x00009888" value="0x161A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12180240" />
+        <register type="NOA" address="0x00009888" value="0x14180002" />
+        <register type="NOA" address="0x00009888" value="0x143A5800" />
+        <register type="NOA" address="0x00009888" value="0x163A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12380240" />
+        <register type="NOA" address="0x00009888" value="0x14380002" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x022F8000" />
+        <register type="NOA" address="0x00009888" value="0x042F3000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C1500" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F9500" />
+        <register type="NOA" address="0x00009888" value="0x100F002A" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x0A2DC000" />
+        <register type="NOA" address="0x00009888" value="0x0C2DC000" />
+        <register type="NOA" address="0x00009888" value="0x04193000" />
+        <register type="NOA" address="0x00009888" value="0x081A28C1" />
+        <register type="NOA" address="0x00009888" value="0x001A0000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x0613C000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x00172000" />
+        <register type="NOA" address="0x00009888" value="0x06178000" />
+        <register type="NOA" address="0x00009888" value="0x0817A000" />
+        <register type="NOA" address="0x00009888" value="0x00180037" />
+        <register type="NOA" address="0x00009888" value="0x06180940" />
+        <register type="NOA" address="0x00009888" value="0x08180000" />
+        <register type="NOA" address="0x00009888" value="0x02180000" />
+        <register type="NOA" address="0x00009888" value="0x04183000" />
+        <register type="NOA" address="0x00009888" value="0x06393000" />
+        <register type="NOA" address="0x00009888" value="0x0C3A28C1" />
+        <register type="NOA" address="0x00009888" value="0x003A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A33F000" />
+        <register type="NOA" address="0x00009888" value="0x0C33F000" />
+        <register type="NOA" address="0x00009888" value="0x0A37A000" />
+        <register type="NOA" address="0x00009888" value="0x0C37A000" />
+        <register type="NOA" address="0x00009888" value="0x0A380977" />
+        <register type="NOA" address="0x00009888" value="0x08380000" />
+        <register type="NOA" address="0x00009888" value="0x04380000" />
+        <register type="NOA" address="0x00009888" value="0x06383000" />
+        <register type="NOA" address="0x00009888" value="0x119000FF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900800" />
+        <register type="NOA" address="0x00009888" value="0x47901000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900844" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00100030" />
+        <register type="OA" address="0x00002774" value="0x0000FFF9" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFF3" />
+        <register type="OA" address="0x00002788" value="0x00100180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="c44a5cf7-886d-477b-bebd-2d738923e4c3"
+       chipset="SKLGT2"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x13805800" />
+        <register type="NOA" address="0x00009888" value="0x05962C00" />
+        <register type="NOA" address="0x00009888" value="0x19950016" />
+        <register type="NOA" address="0x00009888" value="0x21C05800" />
+        <register type="NOA" address="0x00009888" value="0x07800035" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x1D810400" />
+        <register type="NOA" address="0x00009888" value="0x07960025" />
+        <register type="NOA" address="0x00009888" value="0x21960000" />
+        <register type="NOA" address="0x00009888" value="0x0B964000" />
+        <register type="NOA" address="0x00009888" value="0x1B930062" />
+        <register type="NOA" address="0x00009888" value="0x17948000" />
+        <register type="NOA" address="0x00009888" value="0x1B940008" />
+        <register type="NOA" address="0x00009888" value="0x05950075" />
+        <register type="NOA" address="0x00009888" value="0x1D950000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x09978000" />
+        <register type="NOA" address="0x00009888" value="0x0BC000A5" />
+        <register type="NOA" address="0x00009888" value="0x11C00000" />
+        <register type="NOA" address="0x00009888" value="0x05C00000" />
+        <register type="NOA" address="0x00009888" value="0x0BC54000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C60" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00078000" />
+        <register type="OA" address="0x00002774" value="0x00000FFF" />
+    </register_config>
+  </set>
+
+  <set name="FF Bottlenecks"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="ff_bottlenecks"
+       hw_config_guid="e0b2aae4-9b8f-4211-8df0-f8e8cb203209"
+       chipset="SKLGT2"
+       symbol_name="FfBottlenecks"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS is sending vertices to CL"
+             description="The percentage of time in which VS is sending vertices to CL bypassing other pipeline stages."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 4 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_cl_bypass"
+             units="percent"
+             symbol_name="VsClBypass"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw Tier3"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 1 READ B 5 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TE Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which tesselation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ B 6 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="te_bottleneck"
+             units="percent"
+             symbol_name="TeBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 17 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x19867C00" />
+        <register type="NOA" address="0x00009888" value="0x01870000" />
+        <register type="NOA" address="0x00009888" value="0x15880000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0B898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890C00" />
+        <register type="NOA" address="0x00009888" value="0x0D808000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A2000" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0003" />
+        <register type="NOA" address="0x00009888" value="0x1F810002" />
+        <register type="NOA" address="0x00009888" value="0x0982C000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x05833000" />
+        <register type="NOA" address="0x00009888" value="0x07831000" />
+        <register type="NOA" address="0x00009888" value="0x0D848000" />
+        <register type="NOA" address="0x00009888" value="0x0D850080" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x09860080" />
+        <register type="NOA" address="0x00009888" value="0x0D860080" />
+        <register type="NOA" address="0x00009888" value="0x07870C80" />
+        <register type="NOA" address="0x00009888" value="0x0B870C80" />
+        <register type="NOA" address="0x00009888" value="0x01880032" />
+        <register type="NOA" address="0x00009888" value="0x0B888032" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x07888000" />
+        <register type="NOA" address="0x00009888" value="0x1D930010" />
+        <register type="NOA" address="0x00009888" value="0x1D950013" />
+        <register type="NOA" address="0x00009888" value="0x0DE58000" />
+        <register type="NOA" address="0x00009888" value="0x05924000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D92C000" />
+        <register type="NOA" address="0x00009888" value="0x0F92C000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x01981000" />
+        <register type="NOA" address="0x00009888" value="0x07984000" />
+        <register type="NOA" address="0x00009888" value="0x0998A000" />
+        <register type="NOA" address="0x00009888" value="0x0B985000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25904000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29904000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900020" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900400" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00000011" />
+        <register type="FLEX" address="0x0000E758" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00000008" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="1651949f-0ac0-4cb1-a06f-dafd74a407d1"
+       chipset="SKLGT2"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810000" />
+        <register type="NOA" address="0x00009888" value="0x07810016" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930040" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="27871149-2fa9-40ba-aa73-350d60c03a09"
+       chipset="SKLGT2"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x122D3080" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E0FAA00" />
+        <register type="NOA" address="0x00009888" value="0x100F0002" />
+        <register type="NOA" address="0x00009888" value="0x002D0025" />
+        <register type="NOA" address="0x00009888" value="0x062D1300" />
+        <register type="NOA" address="0x00009888" value="0x082D16A4" />
+        <register type="NOA" address="0x00009888" value="0x0A2D162E" />
+        <register type="NOA" address="0x00009888" value="0x102D0000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-sklgt3.xml b/lib/i915/perf-configs/oa-sklgt3.xml
new file mode 100644
index 00000000..05473fdb
--- /dev/null
+++ b/lib/i915/perf-configs/oa-sklgt3.xml
@@ -0,0 +1,10933 @@
+<?xml version="1.0"?>
+<metrics version="1562317147" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="21fef15a-83f4-4ffa-bb81-7da6e38b8e4b"
+       chipset="SKLGT3"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ B 5 READ UADD 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler 1 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 1 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler1_bottleneck"
+             units="percent"
+             symbol_name="Sampler1Bottleneck"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck $Sampler1Bottleneck FMAX"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C01E0" />
+        <register type="NOA" address="0x00009888" value="0x12170280" />
+        <register type="NOA" address="0x00009888" value="0x12370280" />
+        <register type="NOA" address="0x00009888" value="0x16EC01E0" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0380" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A1B4000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0001" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x042F1000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C8400" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0002" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F6600" />
+        <register type="NOA" address="0x00009888" value="0x100F0001" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CA200" />
+        <register type="NOA" address="0x00009888" value="0x062D8000" />
+        <register type="NOA" address="0x00009888" value="0x082D8000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x08133000" />
+        <register type="NOA" address="0x00009888" value="0x00170020" />
+        <register type="NOA" address="0x00009888" value="0x08170021" />
+        <register type="NOA" address="0x00009888" value="0x10170000" />
+        <register type="NOA" address="0x00009888" value="0x0633C000" />
+        <register type="NOA" address="0x00009888" value="0x0833C000" />
+        <register type="NOA" address="0x00009888" value="0x06370800" />
+        <register type="NOA" address="0x00009888" value="0x08370840" />
+        <register type="NOA" address="0x00009888" value="0x10370000" />
+        <register type="NOA" address="0x00009888" value="0x1ACE0200" />
+        <register type="NOA" address="0x00009888" value="0x0AEC5300" />
+        <register type="NOA" address="0x00009888" value="0x10EC0000" />
+        <register type="NOA" address="0x00009888" value="0x1CEC0000" />
+        <register type="NOA" address="0x00009888" value="0x0A9B8000" />
+        <register type="NOA" address="0x00009888" value="0x1C9C0002" />
+        <register type="NOA" address="0x00009888" value="0x0CCC0002" />
+        <register type="NOA" address="0x00009888" value="0x0A8D8000" />
+        <register type="NOA" address="0x00009888" value="0x108F0001" />
+        <register type="NOA" address="0x00009888" value="0x16AC8000" />
+        <register type="NOA" address="0x00009888" value="0x0D933031" />
+        <register type="NOA" address="0x00009888" value="0x0F933E3F" />
+        <register type="NOA" address="0x00009888" value="0x01933D00" />
+        <register type="NOA" address="0x00009888" value="0x0393073C" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1D930000" />
+        <register type="NOA" address="0x00009888" value="0x19930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51907710" />
+        <register type="NOA" address="0x00009888" value="0x419020A0" />
+        <register type="NOA" address="0x00009888" value="0x55901515" />
+        <register type="NOA" address="0x00009888" value="0x45900529" />
+        <register type="NOA" address="0x00009888" value="0x47901025" />
+        <register type="NOA" address="0x00009888" value="0x57907770" />
+        <register type="NOA" address="0x00009888" value="0x49902100" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900108" />
+        <register type="NOA" address="0x00009888" value="0x59900007" />
+        <register type="NOA" address="0x00009888" value="0x43902108" />
+        <register type="NOA" address="0x00009888" value="0x53907777" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="4320492b-fd03-42ac-922f-dbe1ef3b7b58"
+       chipset="SKLGT3"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0820" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x064F0900" />
+        <register type="NOA" address="0x00009888" value="0x084F0032" />
+        <register type="NOA" address="0x00009888" value="0x0A4F1891" />
+        <register type="NOA" address="0x00009888" value="0x0C4F0E00" />
+        <register type="NOA" address="0x00009888" value="0x0E4F003C" />
+        <register type="NOA" address="0x00009888" value="0x004F0D80" />
+        <register type="NOA" address="0x00009888" value="0x024F003B" />
+        <register type="NOA" address="0x00009888" value="0x006C0002" />
+        <register type="NOA" address="0x00009888" value="0x086C0100" />
+        <register type="NOA" address="0x00009888" value="0x0C6C000C" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B00" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x081B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E1B8000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0024" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C6000" />
+        <register type="NOA" address="0x00009888" value="0x1C5C001B" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0208" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+        <register type="NOA" address="0x00009888" value="0x162CFB00" />
+        <register type="NOA" address="0x00009888" value="0x182C00BE" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x19900157" />
+        <register type="NOA" address="0x00009888" value="0x1B900158" />
+        <register type="NOA" address="0x00009888" value="0x1D900105" />
+        <register type="NOA" address="0x00009888" value="0x1F900103" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x11900FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900863" />
+        <register type="NOA" address="0x00009888" value="0x47900802" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900802" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900002" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900C62" />
+        <register type="NOA" address="0x00009888" value="0x53903333" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="bd2d9cae-b9ec-4f5b-9d2f-934bed398a2d"
+       chipset="SKLGT3"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull stall pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x10116800" />
+        <register type="NOA" address="0x00009888" value="0x178A03E0" />
+        <register type="NOA" address="0x00009888" value="0x11824C00" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x13840020" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x01870C40" />
+        <register type="NOA" address="0x00009888" value="0x17880000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x040D4000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020E5400" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x080F0040" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06110012" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890100" />
+        <register type="NOA" address="0x00009888" value="0x03898000" />
+        <register type="NOA" address="0x00009888" value="0x09808000" />
+        <register type="NOA" address="0x00009888" value="0x0B808000" />
+        <register type="NOA" address="0x00009888" value="0x0380C000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+        <register type="NOA" address="0x00009888" value="0x138A8000" />
+        <register type="NOA" address="0x00009888" value="0x1D81A000" />
+        <register type="NOA" address="0x00009888" value="0x15818000" />
+        <register type="NOA" address="0x00009888" value="0x17818000" />
+        <register type="NOA" address="0x00009888" value="0x0B820030" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x05824000" />
+        <register type="NOA" address="0x00009888" value="0x0D830003" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x03838000" />
+        <register type="NOA" address="0x00009888" value="0x07838000" />
+        <register type="NOA" address="0x00009888" value="0x0B840980" />
+        <register type="NOA" address="0x00009888" value="0x03844D80" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x09850080" />
+        <register type="NOA" address="0x00009888" value="0x03850003" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x09870032" />
+        <register type="NOA" address="0x00009888" value="0x01888052" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x09884000" />
+        <register type="NOA" address="0x00009888" value="0x1B931001" />
+        <register type="NOA" address="0x00009888" value="0x1D930001" />
+        <register type="NOA" address="0x00009888" value="0x19934000" />
+        <register type="NOA" address="0x00009888" value="0x1B958000" />
+        <register type="NOA" address="0x00009888" value="0x1D950094" />
+        <register type="NOA" address="0x00009888" value="0x19958000" />
+        <register type="NOA" address="0x00009888" value="0x09E58000" />
+        <register type="NOA" address="0x00009888" value="0x0BE58000" />
+        <register type="NOA" address="0x00009888" value="0x03E5C000" />
+        <register type="NOA" address="0x00009888" value="0x0592C000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D924000" />
+        <register type="NOA" address="0x00009888" value="0x0F924000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x1392C000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x01985000" />
+        <register type="NOA" address="0x00009888" value="0x07988000" />
+        <register type="NOA" address="0x00009888" value="0x09981000" />
+        <register type="NOA" address="0x00009888" value="0x0B982000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x0F989000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1190C080" />
+        <register type="NOA" address="0x00009888" value="0x51901150" />
+        <register type="NOA" address="0x00009888" value="0x41901400" />
+        <register type="NOA" address="0x00009888" value="0x55905111" />
+        <register type="NOA" address="0x00009888" value="0x45901400" />
+        <register type="NOA" address="0x00009888" value="0x479004A5" />
+        <register type="NOA" address="0x00009888" value="0x57903455" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B9000A0" />
+        <register type="NOA" address="0x00009888" value="0x59900001" />
+        <register type="NOA" address="0x00009888" value="0x43900005" />
+        <register type="NOA" address="0x00009888" value="0x53900455" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="4ca0f3fe-7fd3-4924-98cb-1807d9879767"
+       chipset="SKLGT3"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900064" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900150" />
+        <register type="NOA" address="0x00009888" value="0x21900151" />
+        <register type="NOA" address="0x00009888" value="0x23900152" />
+        <register type="NOA" address="0x00009888" value="0x25900153" />
+        <register type="NOA" address="0x00009888" value="0x27900154" />
+        <register type="NOA" address="0x00009888" value="0x29900155" />
+        <register type="NOA" address="0x00009888" value="0x2B900156" />
+        <register type="NOA" address="0x00009888" value="0x2D900157" />
+        <register type="NOA" address="0x00009888" value="0x2F90015F" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="a0c0172c-ee13-403d-99ff-2bdf6936cf14"
+       chipset="SKLGT3"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900160" />
+        <register type="NOA" address="0x00009888" value="0x21900161" />
+        <register type="NOA" address="0x00009888" value="0x23900162" />
+        <register type="NOA" address="0x00009888" value="0x25900163" />
+        <register type="NOA" address="0x00009888" value="0x27900164" />
+        <register type="NOA" address="0x00009888" value="0x29900165" />
+        <register type="NOA" address="0x00009888" value="0x2B900166" />
+        <register type="NOA" address="0x00009888" value="0x2D900167" />
+        <register type="NOA" address="0x00009888" value="0x2F900150" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="52435e0b-f188-42ea-8680-21a56ee20dee"
+       chipset="SKLGT3"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C8160" />
+        <register type="NOA" address="0x00009888" value="0x161C8015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4EAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B01" />
+        <register type="NOA" address="0x00009888" value="0x006C0200" />
+        <register type="NOA" address="0x00009888" value="0x026C000C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0041" />
+        <register type="NOA" address="0x00009888" value="0x061C4200" />
+        <register type="NOA" address="0x00009888" value="0x081C4443" />
+        <register type="NOA" address="0x00009888" value="0x0A1C4645" />
+        <register type="NOA" address="0x00009888" value="0x0C1C7647" />
+        <register type="NOA" address="0x00009888" value="0x041C7357" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0000" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4CAA2A" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02AA" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5515" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x11907FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900802" />
+        <register type="NOA" address="0x00009888" value="0x47900842" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900842" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900800" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="27076eeb-49f3-4fed-8423-c66506005c63"
+       chipset="SKLGT3"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages send to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C0760" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E8020" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1CE000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2A00" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0280" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F1500" />
+        <register type="NOA" address="0x00009888" value="0x100F0140" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C00A0" />
+        <register type="NOA" address="0x00009888" value="0x03933300" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190030F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900063" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x53903333" />
+        <register type="NOA" address="0x00009888" value="0x43900840" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="a1b8363b-b986-47b6-929a-847afde3dec8"
+       chipset="SKLGT3"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x106C0232" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F1880" />
+        <register type="NOA" address="0x00009888" value="0x024F08BB" />
+        <register type="NOA" address="0x00009888" value="0x044F001B" />
+        <register type="NOA" address="0x00009888" value="0x046C0100" />
+        <register type="NOA" address="0x00009888" value="0x066C000B" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x041B8000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025BC000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x165C8000" />
+        <register type="NOA" address="0x00009888" value="0x185C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00A0" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x062CC000" />
+        <register type="NOA" address="0x00009888" value="0x082CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x07830000" />
+        <register type="NOA" address="0x00009888" value="0x1D950080" />
+        <register type="NOA" address="0x00009888" value="0x13928000" />
+        <register type="NOA" address="0x00009888" value="0x0F988000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900005" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="fa857069-7f95-44c9-a3e0-cb8ccbc35abb"
+       chipset="SKLGT3"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C7B40" />
+        <register type="NOA" address="0x00009888" value="0x166C0020" />
+        <register type="NOA" address="0x00009888" value="0x0A603444" />
+        <register type="NOA" address="0x00009888" value="0x0A613400" />
+        <register type="NOA" address="0x00009888" value="0x1A4EA800" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0800" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C003C" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x10600000" />
+        <register type="NOA" address="0x00009888" value="0x04600000" />
+        <register type="NOA" address="0x00009888" value="0x0C610044" />
+        <register type="NOA" address="0x00009888" value="0x10610000" />
+        <register type="NOA" address="0x00009888" value="0x06610000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02A8" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0154" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190FFC0" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900021" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900400" />
+        <register type="NOA" address="0x00009888" value="0x43900421" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="9830a5f3-a5e2-4773-a49d-6371407c382a"
+       chipset="SKLGT3"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C02E0" />
+        <register type="NOA" address="0x00009888" value="0x146C0001" />
+        <register type="NOA" address="0x00009888" value="0x0A623400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x026C3324" />
+        <register type="NOA" address="0x00009888" value="0x046C3422" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x06614000" />
+        <register type="NOA" address="0x00009888" value="0x0C620044" />
+        <register type="NOA" address="0x00009888" value="0x10620000" />
+        <register type="NOA" address="0x00009888" value="0x06620000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="59452ceb-24bb-4878-87ec-87aab7b4f9db"
+       chipset="SKLGT3"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C4E80" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A633400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x026C3321" />
+        <register type="NOA" address="0x00009888" value="0x046C342F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C2000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x06604000" />
+        <register type="NOA" address="0x00009888" value="0x0C630044" />
+        <register type="NOA" address="0x00009888" value="0x10630000" />
+        <register type="NOA" address="0x00009888" value="0x06630000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00AA" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="d2249ff7-34b4-4203-b474-7c11546f9dae"
+       chipset="SKLGT3"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x102F3800" />
+        <register type="NOA" address="0x00009888" value="0x144D0500" />
+        <register type="NOA" address="0x00009888" value="0x120D03C0" />
+        <register type="NOA" address="0x00009888" value="0x140D03CF" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0004" />
+        <register type="NOA" address="0x00009888" value="0x0C4E4000" />
+        <register type="NOA" address="0x00009888" value="0x042F0480" />
+        <register type="NOA" address="0x00009888" value="0x082F0000" />
+        <register type="NOA" address="0x00009888" value="0x022F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0090" />
+        <register type="NOA" address="0x00009888" value="0x064D0027" />
+        <register type="NOA" address="0x00009888" value="0x004D0000" />
+        <register type="NOA" address="0x00009888" value="0x000D0D40" />
+        <register type="NOA" address="0x00009888" value="0x020D803F" />
+        <register type="NOA" address="0x00009888" value="0x040D8023" />
+        <register type="NOA" address="0x00009888" value="0x100D0000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020F0010" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0050" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41901400" />
+        <register type="NOA" address="0x00009888" value="0x43901485" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="c9cf7c63-0065-4226-941e-98590bad8f75"
+       chipset="SKLGT3"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x14152C00" />
+        <register type="NOA" address="0x00009888" value="0x16150005" />
+        <register type="NOA" address="0x00009888" value="0x121600A0" />
+        <register type="NOA" address="0x00009888" value="0x14352C00" />
+        <register type="NOA" address="0x00009888" value="0x16350005" />
+        <register type="NOA" address="0x00009888" value="0x123600A0" />
+        <register type="NOA" address="0x00009888" value="0x14552C00" />
+        <register type="NOA" address="0x00009888" value="0x16550005" />
+        <register type="NOA" address="0x00009888" value="0x125600A0" />
+        <register type="NOA" address="0x00009888" value="0x062F6000" />
+        <register type="NOA" address="0x00009888" value="0x022F2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0050" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0350" />
+        <register type="NOA" address="0x00009888" value="0x0C0FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F00DA" />
+        <register type="NOA" address="0x00009888" value="0x182C0028" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x022DC000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C138000" />
+        <register type="NOA" address="0x00009888" value="0x0E132000" />
+        <register type="NOA" address="0x00009888" value="0x0413C000" />
+        <register type="NOA" address="0x00009888" value="0x1C140018" />
+        <register type="NOA" address="0x00009888" value="0x0C157000" />
+        <register type="NOA" address="0x00009888" value="0x0E150078" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04162180" />
+        <register type="NOA" address="0x00009888" value="0x02160000" />
+        <register type="NOA" address="0x00009888" value="0x04174000" />
+        <register type="NOA" address="0x00009888" value="0x0233A000" />
+        <register type="NOA" address="0x00009888" value="0x04333000" />
+        <register type="NOA" address="0x00009888" value="0x14348000" />
+        <register type="NOA" address="0x00009888" value="0x16348000" />
+        <register type="NOA" address="0x00009888" value="0x02357870" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04360043" />
+        <register type="NOA" address="0x00009888" value="0x02360000" />
+        <register type="NOA" address="0x00009888" value="0x04371000" />
+        <register type="NOA" address="0x00009888" value="0x0E538000" />
+        <register type="NOA" address="0x00009888" value="0x00538000" />
+        <register type="NOA" address="0x00009888" value="0x06533000" />
+        <register type="NOA" address="0x00009888" value="0x1C540020" />
+        <register type="NOA" address="0x00009888" value="0x12548000" />
+        <register type="NOA" address="0x00009888" value="0x0E557000" />
+        <register type="NOA" address="0x00009888" value="0x00557800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06560043" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x06571000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900060" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900060" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="e3bb1501-89ca-43fb-8668-9d96159e10a2"
+       chipset="SKLGT3"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12120000" />
+        <register type="NOA" address="0x00009888" value="0x12320000" />
+        <register type="NOA" address="0x00009888" value="0x12520000" />
+        <register type="NOA" address="0x00009888" value="0x002F8000" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0015" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F03A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0FF000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0095" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x02108000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x02118000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x02121880" />
+        <register type="NOA" address="0x00009888" value="0x041219B5" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x02134000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x0C308000" />
+        <register type="NOA" address="0x00009888" value="0x0E304000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x0C318000" />
+        <register type="NOA" address="0x00009888" value="0x0E314000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x0C321A80" />
+        <register type="NOA" address="0x00009888" value="0x0E320033" />
+        <register type="NOA" address="0x00009888" value="0x06320031" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x0C334000" />
+        <register type="NOA" address="0x00009888" value="0x0E331000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0E508000" />
+        <register type="NOA" address="0x00009888" value="0x00508000" />
+        <register type="NOA" address="0x00009888" value="0x02504000" />
+        <register type="NOA" address="0x00009888" value="0x0E518000" />
+        <register type="NOA" address="0x00009888" value="0x00518000" />
+        <register type="NOA" address="0x00009888" value="0x02514000" />
+        <register type="NOA" address="0x00009888" value="0x0E521880" />
+        <register type="NOA" address="0x00009888" value="0x00521A80" />
+        <register type="NOA" address="0x00009888" value="0x02520033" />
+        <register type="NOA" address="0x00009888" value="0x0E534000" />
+        <register type="NOA" address="0x00009888" value="0x00534000" />
+        <register type="NOA" address="0x00009888" value="0x02531000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900062" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="29194a55-7e75-4152-a71f-ef34b1ae4cca"
+       chipset="SKLGT3"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12124D60" />
+        <register type="NOA" address="0x00009888" value="0x12322E60" />
+        <register type="NOA" address="0x00009888" value="0x12524D60" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0014" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0FE000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0097" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x002D8000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x04121FB7" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x00308000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x00318000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x00321B80" />
+        <register type="NOA" address="0x00009888" value="0x0632003F" />
+        <register type="NOA" address="0x00009888" value="0x00334000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0250C000" />
+        <register type="NOA" address="0x00009888" value="0x0251C000" />
+        <register type="NOA" address="0x00009888" value="0x02521FB7" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x02535000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900063" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="2d80a648-7b5a-4e92-bbe7-3b5c76f2e221"
+       chipset="SKLGT3"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active including Ext Math"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing including Extended Math processing"
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ  C 5 READ C 6 READ FADD C 7 READ FADD C 2 READ FADD C 3 READ FADD C 4 READ FADD 8 FMUL FADD 100 FMUL $EuCoresTotalCount FDIV $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active_adjusted"
+             units="percent"
+             symbol_name="Fpu1ActiveAdjusted"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121203E0" />
+        <register type="NOA" address="0x00009888" value="0x123203E0" />
+        <register type="NOA" address="0x00009888" value="0x125203E0" />
+        <register type="NOA" address="0x00009888" value="0x129203E0" />
+        <register type="NOA" address="0x00009888" value="0x12B203E0" />
+        <register type="NOA" address="0x00009888" value="0x12D203E0" />
+        <register type="NOA" address="0x00009888" value="0x024EC000" />
+        <register type="NOA" address="0x00009888" value="0x044EC000" />
+        <register type="NOA" address="0x00009888" value="0x064EC000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0042" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F006D" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x042D8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06114000" />
+        <register type="NOA" address="0x00009888" value="0x06120033" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x04308000" />
+        <register type="NOA" address="0x00009888" value="0x04318000" />
+        <register type="NOA" address="0x00009888" value="0x04321980" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x04334000" />
+        <register type="NOA" address="0x00009888" value="0x04504000" />
+        <register type="NOA" address="0x00009888" value="0x04514000" />
+        <register type="NOA" address="0x00009888" value="0x04520033" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x04531000" />
+        <register type="NOA" address="0x00009888" value="0x00AF8000" />
+        <register type="NOA" address="0x00009888" value="0x0ACC0001" />
+        <register type="NOA" address="0x00009888" value="0x008D8000" />
+        <register type="NOA" address="0x00009888" value="0x028DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C8FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F0001" />
+        <register type="NOA" address="0x00009888" value="0x06AC8000" />
+        <register type="NOA" address="0x00009888" value="0x02AD4000" />
+        <register type="NOA" address="0x00009888" value="0x02908000" />
+        <register type="NOA" address="0x00009888" value="0x02918000" />
+        <register type="NOA" address="0x00009888" value="0x02921980" />
+        <register type="NOA" address="0x00009888" value="0x00920000" />
+        <register type="NOA" address="0x00009888" value="0x02934000" />
+        <register type="NOA" address="0x00009888" value="0x02B04000" />
+        <register type="NOA" address="0x00009888" value="0x02B14000" />
+        <register type="NOA" address="0x00009888" value="0x02B20033" />
+        <register type="NOA" address="0x00009888" value="0x00B20000" />
+        <register type="NOA" address="0x00009888" value="0x02B31000" />
+        <register type="NOA" address="0x00009888" value="0x00D08000" />
+        <register type="NOA" address="0x00009888" value="0x00D18000" />
+        <register type="NOA" address="0x00009888" value="0x00D21980" />
+        <register type="NOA" address="0x00009888" value="0x00D34000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900402" />
+        <register type="NOA" address="0x00009888" value="0x53901550" />
+        <register type="NOA" address="0x00009888" value="0x45900080" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+  </set>
+
+  <set name="Media Vme Pipe Gen9"
+       mdapi_supported_apis="MEDIA IO BB"
+       underscore_name="vme_pipe"
+       hw_config_guid="cfae9232-6ffc-42cc-a703-9790016925f0"
+       chipset="SKLGT3"
+       symbol_name="VMEPipe"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VME Busy"
+             description="The percentage of time in which VME (IME or CRE) was actively processing data."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vme_busy"
+             units="percent"
+             symbol_name="VMEBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview System Batch Tier2"
+             mdapi_group="VME Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A5800" />
+        <register type="NOA" address="0x00009888" value="0x161A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12180240" />
+        <register type="NOA" address="0x00009888" value="0x14180002" />
+        <register type="NOA" address="0x00009888" value="0x149A5800" />
+        <register type="NOA" address="0x00009888" value="0x169A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12980240" />
+        <register type="NOA" address="0x00009888" value="0x14980002" />
+        <register type="NOA" address="0x00009888" value="0x1A4E3FC0" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x022F8000" />
+        <register type="NOA" address="0x00009888" value="0x042F3000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C9500" />
+        <register type="NOA" address="0x00009888" value="0x0C4C002A" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0015" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C000A" />
+        <register type="NOA" address="0x00009888" value="0x04193000" />
+        <register type="NOA" address="0x00009888" value="0x081A28C1" />
+        <register type="NOA" address="0x00009888" value="0x001A0000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x0613C000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x00172000" />
+        <register type="NOA" address="0x00009888" value="0x06178000" />
+        <register type="NOA" address="0x00009888" value="0x0817A000" />
+        <register type="NOA" address="0x00009888" value="0x00180037" />
+        <register type="NOA" address="0x00009888" value="0x06180940" />
+        <register type="NOA" address="0x00009888" value="0x08180000" />
+        <register type="NOA" address="0x00009888" value="0x02180000" />
+        <register type="NOA" address="0x00009888" value="0x04183000" />
+        <register type="NOA" address="0x00009888" value="0x04AFC000" />
+        <register type="NOA" address="0x00009888" value="0x06AF3000" />
+        <register type="NOA" address="0x00009888" value="0x0ACC4000" />
+        <register type="NOA" address="0x00009888" value="0x0CCC0015" />
+        <register type="NOA" address="0x00009888" value="0x0A8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F4000" />
+        <register type="NOA" address="0x00009888" value="0x108F0015" />
+        <register type="NOA" address="0x00009888" value="0x16ACA000" />
+        <register type="NOA" address="0x00009888" value="0x18AC000A" />
+        <register type="NOA" address="0x00009888" value="0x06993000" />
+        <register type="NOA" address="0x00009888" value="0x0C9A28C1" />
+        <register type="NOA" address="0x00009888" value="0x009A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A93F000" />
+        <register type="NOA" address="0x00009888" value="0x0C93F000" />
+        <register type="NOA" address="0x00009888" value="0x0A97A000" />
+        <register type="NOA" address="0x00009888" value="0x0C97A000" />
+        <register type="NOA" address="0x00009888" value="0x0A980977" />
+        <register type="NOA" address="0x00009888" value="0x08980000" />
+        <register type="NOA" address="0x00009888" value="0x04980000" />
+        <register type="NOA" address="0x00009888" value="0x06983000" />
+        <register type="NOA" address="0x00009888" value="0x119000FF" />
+        <register type="NOA" address="0x00009888" value="0x51900050" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900115" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900884" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900002" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00100030" />
+        <register type="OA" address="0x00002774" value="0x0000FFF9" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFF3" />
+        <register type="OA" address="0x00002788" value="0x00100180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="0c5058ff-fdf4-4e0d-81fb-c0310fb76525"
+       chipset="SKLGT3"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox1 Ring Busy"
+             description="The percentage of time when Vdbox1 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox1_busy"
+             units="percent"
+             symbol_name="Vdbox1Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x21D05800" />
+        <register type="NOA" address="0x00009888" value="0x13805800" />
+        <register type="NOA" address="0x00009888" value="0x05962C25" />
+        <register type="NOA" address="0x00009888" value="0x19950016" />
+        <register type="NOA" address="0x00009888" value="0x21C05800" />
+        <register type="NOA" address="0x00009888" value="0x09D000A5" />
+        <register type="NOA" address="0x00009888" value="0x11D00000" />
+        <register type="NOA" address="0x00009888" value="0x05D00000" />
+        <register type="NOA" address="0x00009888" value="0x09D54000" />
+        <register type="NOA" address="0x00009888" value="0x07800035" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x1D810400" />
+        <register type="NOA" address="0x00009888" value="0x21960000" />
+        <register type="NOA" address="0x00009888" value="0x0996C000" />
+        <register type="NOA" address="0x00009888" value="0x0B964000" />
+        <register type="NOA" address="0x00009888" value="0x19938000" />
+        <register type="NOA" address="0x00009888" value="0x1B930068" />
+        <register type="NOA" address="0x00009888" value="0x15948000" />
+        <register type="NOA" address="0x00009888" value="0x1B94000C" />
+        <register type="NOA" address="0x00009888" value="0x03957500" />
+        <register type="NOA" address="0x00009888" value="0x1D950000" />
+        <register type="NOA" address="0x00009888" value="0x17950000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x07928000" />
+        <register type="NOA" address="0x00009888" value="0x03988000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x09978000" />
+        <register type="NOA" address="0x00009888" value="0x0BC000A5" />
+        <register type="NOA" address="0x00009888" value="0x11C00000" />
+        <register type="NOA" address="0x00009888" value="0x05C00000" />
+        <register type="NOA" address="0x00009888" value="0x0BC54000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900463" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0007C000" />
+        <register type="OA" address="0x00002774" value="0x000007FF" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="2b985803-d3c9-4629-8a4f-634bfecba0e8"
+       chipset="SKLGT3"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810000" />
+        <register type="NOA" address="0x00009888" value="0x07810013" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930040" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="c889fd93-8dc7-4ba5-9451-de34a8b5ea3f"
+       chipset="SKLGT3"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x122D3080" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E0FAA00" />
+        <register type="NOA" address="0x00009888" value="0x100F0002" />
+        <register type="NOA" address="0x00009888" value="0x002D0025" />
+        <register type="NOA" address="0x00009888" value="0x062D1300" />
+        <register type="NOA" address="0x00009888" value="0x082D16A4" />
+        <register type="NOA" address="0x00009888" value="0x0A2D162E" />
+        <register type="NOA" address="0x00009888" value="0x102D0000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/oa-sklgt4.xml b/lib/i915/perf-configs/oa-sklgt4.xml
new file mode 100644
index 00000000..b83fdd7a
--- /dev/null
+++ b/lib/i915/perf-configs/oa-sklgt4.xml
@@ -0,0 +1,10956 @@
+<?xml version="1.0"?>
+<metrics version="1562317147" merge_md5="">
+  <set name="Render Metrics Basic Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_basic"
+       hw_config_guid="95322a71-bb05-4437-bc27-f7dd7b27d136"
+       chipset="SKLGT4"
+       symbol_name="RenderBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Misses 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Cache Misses"
+             description="The total number of sampler cache misses in all LODs in all sampler units."
+             data_type="uint64"
+             equation="B 4 READ B 5 READ UADD B 3 READ UADD 8 UMUL"
+             underscore_name="sampler_l1_misses"
+             units="messages"
+             symbol_name="SamplerL1Misses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$SamplerL1Misses 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Sampler 0 Busy"
+             description="The percentage of time in which Sampler 0 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler0_busy"
+             units="percent"
+             symbol_name="Sampler0Busy"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler 1 Busy"
+             description="The percentage of time in which Sampler 1 has been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler1_busy"
+             units="percent"
+             symbol_name="Sampler1Busy"
+             availability="$SubsliceMask 0x12 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Samplers Busy"
+             description="The percentage of time in which samplers have been processing EU requests."
+             data_type="float"
+             max_equation="100"
+             equation="$Sampler0Busy $Sampler1Busy FMAX"
+             underscore_name="samplers_busy"
+             units="percent"
+             symbol_name="SamplersBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI Fixed Pipe Throughput"
+             description="The total number of GPU memory bytes transferred between 3D Pipeline (Command Dispatch, Input Assembly and Stream Output) and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="B 6 READ B 7 READ UADD 64 UMUL"
+             underscore_name="gti_vf_throughput"
+             units="bytes"
+             symbol_name="GtiVfThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/3D Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler 0 Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which Sampler 0 has been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             max_equation="100"
+             underscore_name="sampler0_bottleneck"
+             units="percent"
+             symbol_name="Sampler0Bottleneck"
+             availability="$SubsliceMask 0x09 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="L3 Lookup Accesses w/o IC"
+             description="The total number of L3 cache lookup accesses w/o IC."
+             data_type="uint64"
+             equation="$SamplerL1Misses $ShaderMemoryAccesses UADD"
+             underscore_name="l3_lookups"
+             units="messages"
+             symbol_name="L3Lookups"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Depth Throughput"
+             description="The total number of GPU memory bytes transferred between depth caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 0 READ C 1 READ UADD 64 UMUL"
+             underscore_name="gti_depth_throughput"
+             units="bytes"
+             symbol_name="GtiDepthThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Depth Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Samplers Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which samplers have been slowing down the pipe when processing EU requests."
+             data_type="float"
+             high_watermark="15"
+             equation="$Sampler0Bottleneck"
+             max_equation="100"
+             underscore_name="sampler_bottleneck"
+             units="percent"
+             symbol_name="SamplerBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Indicate System Frame Batch Draw"
+             mdapi_group="Sampler"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="GTI HDC TLB Lookup Throughput"
+             description="The total number of GPU memory bytes transferred between GTI and HDC, when HDC is doing TLB lookups."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_hdc_lookups_throughput"
+             units="bytes"
+             symbol_name="GtiHdcLookupsThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI RCC Throughput"
+             description="The total number of GPU memory bytes transferred between render color caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 2 READ C 3 READ UADD 64 UMUL"
+             underscore_name="gti_rcc_throughput"
+             units="bytes"
+             symbol_name="GtiRccThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/Color Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C01E0" />
+        <register type="NOA" address="0x00009888" value="0x12170280" />
+        <register type="NOA" address="0x00009888" value="0x12370280" />
+        <register type="NOA" address="0x00009888" value="0x16EC01E0" />
+        <register type="NOA" address="0x00009888" value="0x176C01E0" />
+        <register type="NOA" address="0x00009888" value="0x11930317" />
+        <register type="NOA" address="0x00009888" value="0x159303DF" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x1A4E03B0" />
+        <register type="NOA" address="0x00009888" value="0x0A6C0053" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A1B4000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0001" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x042F1000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4CA400" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0002" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5600" />
+        <register type="NOA" address="0x00009888" value="0x100F0001" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x062D8000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x08133000" />
+        <register type="NOA" address="0x00009888" value="0x00170020" />
+        <register type="NOA" address="0x00009888" value="0x08170021" />
+        <register type="NOA" address="0x00009888" value="0x10170000" />
+        <register type="NOA" address="0x00009888" value="0x0633C000" />
+        <register type="NOA" address="0x00009888" value="0x06370800" />
+        <register type="NOA" address="0x00009888" value="0x10370000" />
+        <register type="NOA" address="0x00009888" value="0x1ACE0230" />
+        <register type="NOA" address="0x00009888" value="0x0AEC5300" />
+        <register type="NOA" address="0x00009888" value="0x10EC0000" />
+        <register type="NOA" address="0x00009888" value="0x1CEC0000" />
+        <register type="NOA" address="0x00009888" value="0x0A9B8000" />
+        <register type="NOA" address="0x00009888" value="0x1C9C0002" />
+        <register type="NOA" address="0x00009888" value="0x0ACC2000" />
+        <register type="NOA" address="0x00009888" value="0x0CCC0002" />
+        <register type="NOA" address="0x00009888" value="0x088D8000" />
+        <register type="NOA" address="0x00009888" value="0x0A8D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F1000" />
+        <register type="NOA" address="0x00009888" value="0x108F0001" />
+        <register type="NOA" address="0x00009888" value="0x16AC8800" />
+        <register type="NOA" address="0x00009888" value="0x1B4E0020" />
+        <register type="NOA" address="0x00009888" value="0x096C5300" />
+        <register type="NOA" address="0x00009888" value="0x116C0000" />
+        <register type="NOA" address="0x00009888" value="0x1D6C0000" />
+        <register type="NOA" address="0x00009888" value="0x091B8000" />
+        <register type="NOA" address="0x00009888" value="0x1B1C8000" />
+        <register type="NOA" address="0x00009888" value="0x0B4C2000" />
+        <register type="NOA" address="0x00009888" value="0x090D8000" />
+        <register type="NOA" address="0x00009888" value="0x0F0F1000" />
+        <register type="NOA" address="0x00009888" value="0x172C0800" />
+        <register type="NOA" address="0x00009888" value="0x0D933031" />
+        <register type="NOA" address="0x00009888" value="0x0F933E3F" />
+        <register type="NOA" address="0x00009888" value="0x01933D00" />
+        <register type="NOA" address="0x00009888" value="0x0393073C" />
+        <register type="NOA" address="0x00009888" value="0x0593000E" />
+        <register type="NOA" address="0x00009888" value="0x1D930000" />
+        <register type="NOA" address="0x00009888" value="0x19930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x2B908000" />
+        <register type="NOA" address="0x00009888" value="0x2D908000" />
+        <register type="NOA" address="0x00009888" value="0x2F908000" />
+        <register type="NOA" address="0x00009888" value="0x31908000" />
+        <register type="NOA" address="0x00009888" value="0x15908000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x5190FF30" />
+        <register type="NOA" address="0x00009888" value="0x41900060" />
+        <register type="NOA" address="0x00009888" value="0x55903033" />
+        <register type="NOA" address="0x00009888" value="0x45901421" />
+        <register type="NOA" address="0x00009888" value="0x47900803" />
+        <register type="NOA" address="0x00009888" value="0x5790FFF1" />
+        <register type="NOA" address="0x00009888" value="0x49900001" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x5990000F" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x5390FFFF" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00222222" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Basic Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_basic"
+       hw_config_guid="7277228f-e7f3-4743-945a-6a2049d11377"
+       chipset="SKLGT4"
+       symbol_name="ComputeBasic"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 6 READ B 7 READ C 0 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_read"
+             units="bytes"
+             symbol_name="UntypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Bytes Written"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 3 READ B 4 READ B 5 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_written"
+             units="bytes"
+             symbol_name="TypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Untyped Writes"
+             description="The total number of untyped memory bytes written via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 1 READ C 2 READ C 3 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="untyped_bytes_written"
+             units="bytes"
+             symbol_name="UntypedBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="Typed Bytes Read"
+             description="The total number of typed memory bytes read via Data Port."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="B 0 READ B 1 READ B 2 READ UADD UADD $EuSlicesTotalCount 64 UMUL UMUL"
+             underscore_name="typed_bytes_read"
+             units="bytes"
+             symbol_name="TypedBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 5 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO OCL BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F00E0" />
+        <register type="NOA" address="0x00009888" value="0x124F1C00" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E0820" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x064F0900" />
+        <register type="NOA" address="0x00009888" value="0x084F0032" />
+        <register type="NOA" address="0x00009888" value="0x0A4F1891" />
+        <register type="NOA" address="0x00009888" value="0x0C4F0E00" />
+        <register type="NOA" address="0x00009888" value="0x0E4F003C" />
+        <register type="NOA" address="0x00009888" value="0x004F0D80" />
+        <register type="NOA" address="0x00009888" value="0x024F003B" />
+        <register type="NOA" address="0x00009888" value="0x006C0002" />
+        <register type="NOA" address="0x00009888" value="0x086C0100" />
+        <register type="NOA" address="0x00009888" value="0x0C6C000C" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B00" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x081B8000" />
+        <register type="NOA" address="0x00009888" value="0x0C1B4000" />
+        <register type="NOA" address="0x00009888" value="0x0E1B8000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C8000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0024" />
+        <register type="NOA" address="0x00009888" value="0x065B8000" />
+        <register type="NOA" address="0x00009888" value="0x085B4000" />
+        <register type="NOA" address="0x00009888" value="0x0A5BC000" />
+        <register type="NOA" address="0x00009888" value="0x0C5B8000" />
+        <register type="NOA" address="0x00009888" value="0x0E5B4000" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C6000" />
+        <register type="NOA" address="0x00009888" value="0x1C5C001B" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0208" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2CC000" />
+        <register type="NOA" address="0x00009888" value="0x162CFB00" />
+        <register type="NOA" address="0x00009888" value="0x182C00BE" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x19900157" />
+        <register type="NOA" address="0x00009888" value="0x1B900158" />
+        <register type="NOA" address="0x00009888" value="0x1D900105" />
+        <register type="NOA" address="0x00009888" value="0x1F900103" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x11900FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900821" />
+        <register type="NOA" address="0x00009888" value="0x47900802" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900802" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900002" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900422" />
+        <register type="NOA" address="0x00009888" value="0x53905555" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Render Metrics for 3D Pipeline Profile Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="render_pipe_profile"
+       hw_config_guid="463c668c-3f60-49b6-8f85-d995b635b3b2"
+       chipset="SKLGT4"
+       symbol_name="RenderPipeProfile"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which vertex shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_bottleneck"
+             units="percent"
+             symbol_name="VsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Hi-Depth Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which early hierarchical depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hi_depth_bottleneck"
+             units="percent"
+             symbol_name="HiDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which geometry shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gs_bottleneck"
+             units="percent"
+             symbol_name="GsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Geometry Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="BC Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which barycentric coordinates calculation pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="bc_bottleneck"
+             units="percent"
+             symbol_name="BcBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Barycentric Calc"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Stall"
+             description="The percentage of time in which hull stall pipeline stage was stalled."
+             data_type="float"
+             equation="C 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_stall"
+             units="percent"
+             symbol_name="HsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Hull Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="VF Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which vertex fetch pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="C 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vf_bottleneck"
+             units="percent"
+             symbol_name="VfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Input Assembler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Strip-Fans Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which strip-fans pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="10"
+             equation="B 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_bottleneck"
+             units="percent"
+             symbol_name="SfBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SF Stall"
+             description="The percentage of time in which strip-fans pipeline stage was stalled."
+             data_type="float"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sf_stall"
+             units="percent"
+             symbol_name="SfStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Strip-Fans"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="HS Bottleneck"
+             low_watermark="3"
+             description="The percentage of time in which hull shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="9"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="hs_bottleneck"
+             units="percent"
+             symbol_name="HsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Hull Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CL Stall"
+             description="The percentage of time in which clipper pipeline stage was stalled."
+             data_type="float"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_stall"
+             units="percent"
+             symbol_name="ClStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Clipper"
+             />
+    <counter name="SO Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which stream output pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_bottleneck"
+             units="percent"
+             symbol_name="SoBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Stream Output"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="DS Bottleneck"
+             low_watermark="5"
+             description="The percentage of time in which domain shader pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="15"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_bottleneck"
+             units="percent"
+             symbol_name="DsBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Domain Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Clipper Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which clipper pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="cl_bottleneck"
+             units="percent"
+             symbol_name="ClBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Clipper"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Stall"
+             description="The percentage of time in which domain shader pipeline stage was stalled."
+             data_type="float"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ds_stall"
+             units="percent"
+             symbol_name="DsStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Domain Shader"
+             />
+    <counter name="Early Depth Bottleneck"
+             low_watermark="10"
+             description="The percentage of time in which early depth test pipeline stage was slowing down the 3D pipeline."
+             data_type="float"
+             high_watermark="30"
+             equation="B 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="early_depth_bottleneck"
+             units="percent"
+             symbol_name="EarlyDepthBottleneck"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Indicate Draw"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SO Stall"
+             description="The percentage of time in which stream-output pipeline stage was stalled."
+             data_type="float"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="so_stall"
+             units="percent"
+             symbol_name="SoStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Correlate Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Stream Output"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x0C0E001F" />
+        <register type="NOA" address="0x00009888" value="0x0A0F0000" />
+        <register type="NOA" address="0x00009888" value="0x10116800" />
+        <register type="NOA" address="0x00009888" value="0x178A03E0" />
+        <register type="NOA" address="0x00009888" value="0x11824C00" />
+        <register type="NOA" address="0x00009888" value="0x11830020" />
+        <register type="NOA" address="0x00009888" value="0x13840020" />
+        <register type="NOA" address="0x00009888" value="0x11850019" />
+        <register type="NOA" address="0x00009888" value="0x11860007" />
+        <register type="NOA" address="0x00009888" value="0x01870C40" />
+        <register type="NOA" address="0x00009888" value="0x17880000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0040" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x040D4000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020E5400" />
+        <register type="NOA" address="0x00009888" value="0x000E0000" />
+        <register type="NOA" address="0x00009888" value="0x080F0040" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x100F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0040" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06110012" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x01898000" />
+        <register type="NOA" address="0x00009888" value="0x0D890100" />
+        <register type="NOA" address="0x00009888" value="0x03898000" />
+        <register type="NOA" address="0x00009888" value="0x09808000" />
+        <register type="NOA" address="0x00009888" value="0x0B808000" />
+        <register type="NOA" address="0x00009888" value="0x0380C000" />
+        <register type="NOA" address="0x00009888" value="0x0F8A0075" />
+        <register type="NOA" address="0x00009888" value="0x1D8A0000" />
+        <register type="NOA" address="0x00009888" value="0x118A8000" />
+        <register type="NOA" address="0x00009888" value="0x1B8A4000" />
+        <register type="NOA" address="0x00009888" value="0x138A8000" />
+        <register type="NOA" address="0x00009888" value="0x1D81A000" />
+        <register type="NOA" address="0x00009888" value="0x15818000" />
+        <register type="NOA" address="0x00009888" value="0x17818000" />
+        <register type="NOA" address="0x00009888" value="0x0B820030" />
+        <register type="NOA" address="0x00009888" value="0x07828000" />
+        <register type="NOA" address="0x00009888" value="0x0D824000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x05824000" />
+        <register type="NOA" address="0x00009888" value="0x0D830003" />
+        <register type="NOA" address="0x00009888" value="0x0583000C" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x03838000" />
+        <register type="NOA" address="0x00009888" value="0x07838000" />
+        <register type="NOA" address="0x00009888" value="0x0B840980" />
+        <register type="NOA" address="0x00009888" value="0x03844D80" />
+        <register type="NOA" address="0x00009888" value="0x11840000" />
+        <register type="NOA" address="0x00009888" value="0x09848000" />
+        <register type="NOA" address="0x00009888" value="0x09850080" />
+        <register type="NOA" address="0x00009888" value="0x03850003" />
+        <register type="NOA" address="0x00009888" value="0x01850000" />
+        <register type="NOA" address="0x00009888" value="0x07860000" />
+        <register type="NOA" address="0x00009888" value="0x0F860400" />
+        <register type="NOA" address="0x00009888" value="0x09870032" />
+        <register type="NOA" address="0x00009888" value="0x01888052" />
+        <register type="NOA" address="0x00009888" value="0x11880000" />
+        <register type="NOA" address="0x00009888" value="0x09884000" />
+        <register type="NOA" address="0x00009888" value="0x1B931001" />
+        <register type="NOA" address="0x00009888" value="0x1D930001" />
+        <register type="NOA" address="0x00009888" value="0x19934000" />
+        <register type="NOA" address="0x00009888" value="0x1B958000" />
+        <register type="NOA" address="0x00009888" value="0x1D950094" />
+        <register type="NOA" address="0x00009888" value="0x19958000" />
+        <register type="NOA" address="0x00009888" value="0x09E58000" />
+        <register type="NOA" address="0x00009888" value="0x0BE58000" />
+        <register type="NOA" address="0x00009888" value="0x03E5C000" />
+        <register type="NOA" address="0x00009888" value="0x0592C000" />
+        <register type="NOA" address="0x00009888" value="0x0B928000" />
+        <register type="NOA" address="0x00009888" value="0x0D924000" />
+        <register type="NOA" address="0x00009888" value="0x0F924000" />
+        <register type="NOA" address="0x00009888" value="0x11928000" />
+        <register type="NOA" address="0x00009888" value="0x1392C000" />
+        <register type="NOA" address="0x00009888" value="0x09924000" />
+        <register type="NOA" address="0x00009888" value="0x01985000" />
+        <register type="NOA" address="0x00009888" value="0x07988000" />
+        <register type="NOA" address="0x00009888" value="0x09981000" />
+        <register type="NOA" address="0x00009888" value="0x0B982000" />
+        <register type="NOA" address="0x00009888" value="0x0D982000" />
+        <register type="NOA" address="0x00009888" value="0x0F989000" />
+        <register type="NOA" address="0x00009888" value="0x05982000" />
+        <register type="NOA" address="0x00009888" value="0x13904000" />
+        <register type="NOA" address="0x00009888" value="0x21904000" />
+        <register type="NOA" address="0x00009888" value="0x23904000" />
+        <register type="NOA" address="0x00009888" value="0x25908000" />
+        <register type="NOA" address="0x00009888" value="0x27904000" />
+        <register type="NOA" address="0x00009888" value="0x29908000" />
+        <register type="NOA" address="0x00009888" value="0x2B904000" />
+        <register type="NOA" address="0x00009888" value="0x2F904000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x15904000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B904000" />
+        <register type="NOA" address="0x00009888" value="0x1190C080" />
+        <register type="NOA" address="0x00009888" value="0x51901110" />
+        <register type="NOA" address="0x00009888" value="0x41900440" />
+        <register type="NOA" address="0x00009888" value="0x55901111" />
+        <register type="NOA" address="0x00009888" value="0x45900400" />
+        <register type="NOA" address="0x00009888" value="0x47900C21" />
+        <register type="NOA" address="0x00009888" value="0x57901411" />
+        <register type="NOA" address="0x00009888" value="0x49900042" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900024" />
+        <register type="NOA" address="0x00009888" value="0x59900001" />
+        <register type="NOA" address="0x00009888" value="0x43900841" />
+        <register type="NOA" address="0x00009888" value="0x53900411" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFEA" />
+        <register type="OA" address="0x00002774" value="0x00007FFC" />
+        <register type="OA" address="0x00002778" value="0x0007AFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000F5FD" />
+        <register type="OA" address="0x00002780" value="0x00079FFA" />
+        <register type="OA" address="0x00002784" value="0x0000F3FB" />
+        <register type="OA" address="0x00002788" value="0x0007BF7A" />
+        <register type="OA" address="0x0000278C" value="0x0000F7E7" />
+        <register type="OA" address="0x00002790" value="0x0007FEFA" />
+        <register type="OA" address="0x00002794" value="0x0000F7CF" />
+        <register type="OA" address="0x00002798" value="0x00077FFA" />
+        <register type="OA" address="0x0000279C" value="0x0000EFDF" />
+        <register type="OA" address="0x000027A0" value="0x0006FFFA" />
+        <register type="OA" address="0x000027A4" value="0x0000CFBF" />
+        <register type="OA" address="0x000027A8" value="0x0003FFFA" />
+        <register type="OA" address="0x000027AC" value="0x00005F7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Reads Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_reads"
+       hw_config_guid="3ae6e74c-72c3-4040-9bd0-7961430b8cc8"
+       chipset="SKLGT4"
+       symbol_name="MemoryReads"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank0Reads"
+             description="The total number of GTI memory reads from L3 Bank 0 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_reads"
+             units="messages"
+             symbol_name="GtiL3Bank0Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all accesses from GTI to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiL3Bank3Reads"
+             description="The total number of GTI memory reads from L3 Bank 3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_reads"
+             units="messages"
+             symbol_name="GtiL3Bank3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiRsMemoryReads"
+             description="The total number of GTI memory reads from Resource Streamer."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_rs_memory_reads"
+             units="messages"
+             symbol_name="GtiRsMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Resource Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiHizMemoryReads"
+             description="The total number of GTI memory reads from Hierarchical Depth Cache (Hi-Depth Cache misses)."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_reads"
+             units="messages"
+             symbol_name="GtiHizMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="GtiRccMemoryReads"
+             description="The total number of GTI memory reads from Render Color Cache (Render Color Cache misses)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_reads"
+             units="messages"
+             symbol_name="GtiRccMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Bank1Reads"
+             description="The total number of GTI memory reads from L3 Bank 1 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_reads"
+             units="messages"
+             symbol_name="GtiL3Bank1Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiCmdStreamerMemoryReads"
+             description="The total number of GTI memory reads from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_reads"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="GtiL3Bank2Reads"
+             description="The total number of GTI memory reads from L3 Bank 2 (L3 Cache misses)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_reads"
+             units="messages"
+             symbol_name="GtiL3Bank2Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiMemoryReads"
+             description="The total number of GTI memory reads."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_reads"
+             units="messages"
+             symbol_name="GtiMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="GtiRczMemoryReads"
+             description="The total number of GTI memory reads from Render Depth Cache (Render Depth Cache misses)."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_reads"
+             units="messages"
+             symbol_name="GtiRczMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="GtiMscMemoryReads"
+             description="The total number of GTI memory reads from Multisampling Color Cache (Multisampling Color Cache misses)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_reads"
+             units="messages"
+             symbol_name="GtiMscMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiVfMemoryReads"
+             description="The total number of GTI memory reads from Vertex Fetch."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="gti_vf_memory_reads"
+             units="messages"
+             symbol_name="GtiVfMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Vertex Fetch"
+             />
+    <counter name="GtiStcMemoryReads"
+             description="The total number of GTI memory reads from Stencil Cache (Stencil Cache misses)."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_reads"
+             units="messages"
+             symbol_name="GtiStcMemoryReads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiL3Reads"
+             description="The total number of GTI memory reads from L3 (L3 Cache misses)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Reads $GtiL3Bank1Reads $GtiL3Bank2Reads $GtiL3Bank3Reads UADD UADD UADD"
+             underscore_name="gti_l3_reads"
+             units="messages"
+             symbol_name="GtiL3Reads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F900064" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900150" />
+        <register type="NOA" address="0x00009888" value="0x21900151" />
+        <register type="NOA" address="0x00009888" value="0x23900152" />
+        <register type="NOA" address="0x00009888" value="0x25900153" />
+        <register type="NOA" address="0x00009888" value="0x27900154" />
+        <register type="NOA" address="0x00009888" value="0x29900155" />
+        <register type="NOA" address="0x00009888" value="0x2B900156" />
+        <register type="NOA" address="0x00009888" value="0x2D900157" />
+        <register type="NOA" address="0x00009888" value="0x2F90015F" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F872" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Memory Writes Distribution Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="memory_writes"
+       hw_config_guid="055f256d-4052-467c-8dec-6064a4806433"
+       chipset="SKLGT4"
+       symbol_name="MemoryWrites"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiMemoryWrites"
+             description="The total number of GTI memory writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="gti_memory_writes"
+             units="messages"
+             symbol_name="GtiMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="GtiRingAccesses"
+             description="The total number of all GTI accesses to the ring."
+             data_type="uint64"
+             equation="C 3 READ 2 UMUL"
+             underscore_name="gti_ring_accesses"
+             units="messages"
+             symbol_name="GtiRingAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="GtiMscMemoryWrites"
+             description="The total number of GTI memory writes from Multisampling Color Cache (Multisampling Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="gti_msc_memory_writes"
+             units="messages"
+             symbol_name="GtiMscMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="GtiCmdStreamerMemoryWrites"
+             description="The total number of GTI memory writes from Command Streamer."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="gti_cmd_streamer_memory_writes"
+             units="messages"
+             symbol_name="GtiCmdStreamerMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Command Streamer"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GtiL3Bank0Writes"
+             description="The total number of GTI memory writes from L3 Bank 0 (L3 Bank 0 invalidations)."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="gti_l3_bank0_writes"
+             units="messages"
+             symbol_name="GtiL3Bank0Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank1Writes"
+             description="The total number of GTI memory writes from L3 Bank 1 (L3 Bank 1 invalidations)."
+             data_type="uint64"
+             equation="C 5 READ"
+             underscore_name="gti_l3_bank1_writes"
+             units="messages"
+             symbol_name="GtiL3Bank1Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank2Writes"
+             description="The total number of GTI memory writes from L3 Bank 2 (L3 Bank 2 invalidations)."
+             data_type="uint64"
+             equation="C 6 READ"
+             underscore_name="gti_l3_bank2_writes"
+             units="messages"
+             symbol_name="GtiL3Bank2Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Bank3Writes"
+             description="The total number of GTI memory writes from L3 Bank 3 (L3 Bank 3 invalidations)."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="gti_l3_bank3_writes"
+             units="messages"
+             symbol_name="GtiL3Bank3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GtiL3Writes"
+             description="The total number of GTI memory writes from L3 (L3 invalidations)."
+             data_type="uint64"
+             equation="$GtiL3Bank0Writes $GtiL3Bank1Writes $GtiL3Bank2Writes $GtiL3Bank3Writes UADD UADD UADD"
+             underscore_name="gti_l3_writes"
+             units="messages"
+             symbol_name="GtiL3Writes"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/L3"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiRccMemoryWrites"
+             description="The total number of GTI memory writes from Render Color Cache (Render Color Cache invalidations)."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="gti_rcc_memory_writes"
+             units="messages"
+             symbol_name="GtiRccMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Color Cache"
+             />
+    <counter name="GtiSoMemoryWrites"
+             description="The total number of GTI memory writes from Stream Output."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="gti_so_memory_writes"
+             units="messages"
+             symbol_name="GtiSoMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/3D Pipe/Stream Output"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GtiStcMemoryWrites"
+             description="The total number of GTI memory writes from Stencil Cache."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="gti_stc_memory_writes"
+             units="messages"
+             symbol_name="GtiStcMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="GtiRczMemoryWrites"
+             description="The total number of GTI memory writes from Render Depth Cache."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="gti_rcz_memory_writes"
+             units="messages"
+             symbol_name="GtiRczMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="GtiHizMemoryWrites"
+             description="The total number of GTI memory writes from Hierarchical Depth Cache."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="gti_hiz_memory_writes"
+             units="messages"
+             symbol_name="GtiHizMemoryWrites"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GTI/Depth Cache"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810C00" />
+        <register type="NOA" address="0x00009888" value="0x1381001A" />
+        <register type="NOA" address="0x00009888" value="0x37906800" />
+        <register type="NOA" address="0x00009888" value="0x3F901000" />
+        <register type="NOA" address="0x00009888" value="0x03811300" />
+        <register type="NOA" address="0x00009888" value="0x05811B12" />
+        <register type="NOA" address="0x00009888" value="0x0781001A" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x17810000" />
+        <register type="NOA" address="0x00009888" value="0x19810000" />
+        <register type="NOA" address="0x00009888" value="0x1B810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930055" />
+        <register type="NOA" address="0x00009888" value="0x03E58000" />
+        <register type="NOA" address="0x00009888" value="0x05E5C000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x13900160" />
+        <register type="NOA" address="0x00009888" value="0x21900161" />
+        <register type="NOA" address="0x00009888" value="0x23900162" />
+        <register type="NOA" address="0x00009888" value="0x25900163" />
+        <register type="NOA" address="0x00009888" value="0x27900164" />
+        <register type="NOA" address="0x00009888" value="0x29900165" />
+        <register type="NOA" address="0x00009888" value="0x2B900166" />
+        <register type="NOA" address="0x00009888" value="0x2D900167" />
+        <register type="NOA" address="0x00009888" value="0x2F900150" />
+        <register type="NOA" address="0x00009888" value="0x31900105" />
+        <register type="NOA" address="0x00009888" value="0x15900103" />
+        <register type="NOA" address="0x00009888" value="0x17900101" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C60" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900C63" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C63" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900063" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x0000272C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002728" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x0000271C" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002718" value="0xFFFFFFFF" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x0000274C" value="0x86543210" />
+        <register type="OA" address="0x00002748" value="0x86543210" />
+        <register type="OA" address="0x00002744" value="0x00006667" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x0000275C" value="0x86543210" />
+        <register type="OA" address="0x00002758" value="0x86543210" />
+        <register type="OA" address="0x00002754" value="0x00006465" />
+        <register type="OA" address="0x00002750" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007F81A" />
+        <register type="OA" address="0x00002774" value="0x0000FE00" />
+        <register type="OA" address="0x00002778" value="0x0007F82A" />
+        <register type="OA" address="0x0000277C" value="0x0000FE00" />
+        <register type="OA" address="0x00002780" value="0x0007F822" />
+        <register type="OA" address="0x00002784" value="0x0000FE00" />
+        <register type="OA" address="0x00002788" value="0x0007F8BA" />
+        <register type="OA" address="0x0000278C" value="0x0000FE00" />
+        <register type="OA" address="0x00002790" value="0x0007F87A" />
+        <register type="OA" address="0x00002794" value="0x0000FE00" />
+        <register type="OA" address="0x00002798" value="0x0007F8EA" />
+        <register type="OA" address="0x0000279C" value="0x0000FE00" />
+        <register type="OA" address="0x000027A0" value="0x0007F8E2" />
+        <register type="OA" address="0x000027A4" value="0x0000FE00" />
+        <register type="OA" address="0x000027A8" value="0x0007F8F2" />
+        <register type="OA" address="0x000027AC" value="0x0000FE00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00015014" />
+        <register type="FLEX" address="0x0000E658" value="0x00025024" />
+        <register type="FLEX" address="0x0000E758" value="0x00035034" />
+        <register type="FLEX" address="0x0000E45C" value="0x00045044" />
+        <register type="FLEX" address="0x0000E55C" value="0x00055054" />
+        <register type="FLEX" address="0x0000E65C" value="0x00065064" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extended Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extended"
+       hw_config_guid="753972d4-87cd-4460-824d-754463ac5054"
+       chipset="SKLGT4"
+       symbol_name="ComputeExtended"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Typed Writes 0"
+             description="The subslice 0 typed writes."
+             data_type="uint64"
+             equation="C 0 READ"
+             underscore_name="typed_writes0"
+             units="messages"
+             symbol_name="TypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuTypedAtomics0"
+             description="The subslice 0 EU Typed Atomics subslice 0."
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="eu_typed_atomics0"
+             units="messages"
+             symbol_name="EuTypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Atomics 0"
+             description="The subslice 0 typed atomics."
+             data_type="uint64"
+             equation="C 4 READ"
+             underscore_name="typed_atomics0"
+             units="messages"
+             symbol_name="TypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedAtomicsPerCacheLine"
+             description="The ratio of EU typed atomics requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedAtomics0 $TypedAtomics0 FDIV"
+             underscore_name="typed_atomics_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedAtomicsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedReads0"
+             description="The subslice 0 EU Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="eu_untyped_reads0"
+             units="messages"
+             symbol_name="EuUntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Writes 0"
+             description="The subslice 0 untyped writes (including SLM writes)."
+             data_type="uint64"
+             equation="C 1 READ"
+             underscore_name="untyped_writes0"
+             units="messages"
+             symbol_name="UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedAtomics0"
+             description="The subslice 0 EU Untyped Atomics subslice 0."
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="eu_untyped_atomics0"
+             units="messages"
+             symbol_name="EuUntypedAtomics0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuUntypedWrites0"
+             description="The subslice 0 EU Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="eu_untyped_writes0"
+             units="messages"
+             symbol_name="EuUntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedWrites0"
+             description="The subslice 0 EU A64 Untyped Writes subslice 0."
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="eu_a64_untyped_writes0"
+             units="messages"
+             symbol_name="EuA64UntypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedWritesPerCacheLine"
+             description="The ratio of EU untyped write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuUntypedWrites0 $EuA64UntypedWrites0 UADD $UntypedWrites0 FDIV"
+             underscore_name="untyped_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedWrites0"
+             description="The subslice 0 EU Typed Writes subslice 0."
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="eu_typed_writes0"
+             units="messages"
+             symbol_name="EuTypedWrites0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedWritesPerCacheLine"
+             description="The ratio of EU typed write requests to L3 cache line writes."
+             data_type="float"
+             equation="$EuTypedWrites0 $TypedWrites0 FDIV"
+             underscore_name="typed_writes_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedWritesPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Typed Reads 0"
+             description="The subslice 0 typed reads."
+             data_type="uint64"
+             equation="C 2 READ"
+             underscore_name="typed_reads0"
+             units="messages"
+             symbol_name="TypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Untyped Reads 0"
+             description="The subslice 0 untyped reads (including SLM reads)."
+             data_type="uint64"
+             equation="C 3 READ"
+             underscore_name="untyped_reads0"
+             units="messages"
+             symbol_name="UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EuA64UntypedReads0"
+             description="The subslice 0 EU A64 Untyped Reads subslice 0."
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="eu_a64_untyped_reads0"
+             units="messages"
+             symbol_name="EuA64UntypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ 8 UMUL $EuCoresTotalCount UDIV $EuThreadsCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EuTypedReads0"
+             description="The subslice 0 EU Typed Reads subslice 0."
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="eu_typed_reads0"
+             units="messages"
+             symbol_name="EuTypedReads0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="UntypedReadsPerCacheLine"
+             description="The ratio of EU untyped read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuUntypedReads0 $EuA64UntypedReads0 UADD $UntypedReads0 FDIV"
+             underscore_name="untyped_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="UntypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="TypedReadsPerCacheLine"
+             description="The ratio of EU typed read requests to L3 cache line reads."
+             data_type="float"
+             equation="$EuTypedReads0 $TypedReads0 FDIV"
+             underscore_name="typed_reads_per_cache_line"
+             units="eu sends to l3 cache lines"
+             symbol_name="TypedReadsPerCacheLine"
+             semantic_type="ratio"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="subslice"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x106C00E0" />
+        <register type="NOA" address="0x00009888" value="0x141C8160" />
+        <register type="NOA" address="0x00009888" value="0x161C8015" />
+        <register type="NOA" address="0x00009888" value="0x181C0120" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4EAAA0" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E6C0B01" />
+        <register type="NOA" address="0x00009888" value="0x006C0200" />
+        <register type="NOA" address="0x00009888" value="0x026C000C" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x001C0041" />
+        <register type="NOA" address="0x00009888" value="0x061C4200" />
+        <register type="NOA" address="0x00009888" value="0x081C4443" />
+        <register type="NOA" address="0x00009888" value="0x0A1C4645" />
+        <register type="NOA" address="0x00009888" value="0x0C1C7647" />
+        <register type="NOA" address="0x00009888" value="0x041C7357" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x101C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0000" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4CAA2A" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02AA" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x000DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5515" />
+        <register type="NOA" address="0x00009888" value="0x100F0155" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x11907FFF" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900040" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900802" />
+        <register type="NOA" address="0x00009888" value="0x47900842" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900842" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x43900800" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FC2A" />
+        <register type="OA" address="0x00002774" value="0x0000BF00" />
+        <register type="OA" address="0x00002778" value="0x0007FC6A" />
+        <register type="OA" address="0x0000277C" value="0x0000BF00" />
+        <register type="OA" address="0x00002780" value="0x0007FC92" />
+        <register type="OA" address="0x00002784" value="0x0000BF00" />
+        <register type="OA" address="0x00002788" value="0x0007FCA2" />
+        <register type="OA" address="0x0000278C" value="0x0000BF00" />
+        <register type="OA" address="0x00002790" value="0x0007FC32" />
+        <register type="OA" address="0x00002794" value="0x0000BF00" />
+        <register type="OA" address="0x00002798" value="0x0007FC9A" />
+        <register type="OA" address="0x0000279C" value="0x0000BF00" />
+        <register type="OA" address="0x000027A0" value="0x0007FE6A" />
+        <register type="OA" address="0x000027A4" value="0x0000BF00" />
+        <register type="OA" address="0x000027A8" value="0x0007FE7A" />
+        <register type="OA" address="0x000027AC" value="0x0000BF00" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00778008" />
+        <register type="FLEX" address="0x0000E45C" value="0x00088078" />
+        <register type="FLEX" address="0x0000E55C" value="0x00808708" />
+        <register type="FLEX" address="0x0000E65C" value="0x00A08908" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics L3 Cache Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_l3_cache"
+       hw_config_guid="4e4392e9-8f73-457b-ab44-b49f7a0c733b"
+       chipset="SKLGT4"
+       symbol_name="ComputeL3Cache"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 03 Accesses"
+             description="The total number of accesses to L3 Bank 03."
+             data_type="uint64"
+             equation="B 3 READ 2 UMUL"
+             underscore_name="l3_bank03_accesses"
+             units="messages"
+             symbol_name="L3Bank03Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="L3 Accesses"
+             description="The total number of L3 accesses from all entities."
+             data_type="uint64"
+             equation="C 0 READ C 1 READ B 2 READ B 3 READ UADD UADD UADD 2 UMUL"
+             underscore_name="l3_accesses"
+             units="messages"
+             symbol_name="L3Accesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Sampler Throughput"
+             description="The total number of GPU memory bytes transferred between samplers and L3 caches."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="A 29 READ 64 UMUL"
+             underscore_name="l3_sampler_throughput"
+             units="bytes"
+             symbol_name="L3SamplerThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Sampler"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu0_active"
+             units="percent"
+             symbol_name="Fpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU AVG IPC Rate"
+             description="The average rate of IPC calculated for 2 FPU pipelines."
+             data_type="float"
+             max_equation="2"
+             equation="A 9 READ  A 10 READ  A 11 READ UADD  A 9 READ USUB FDIV 1 FADD"
+             underscore_name="eu_avg_ipc_rate"
+             units="number"
+             symbol_name="EuAvgIpcRate"
+             semantic_type="ratio"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="EU FPU0 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 13 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu0_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Misses"
+             description="The total number of L3 misses."
+             data_type="uint64"
+             equation="C 4 READ C 5 READ UADD"
+             underscore_name="l3_misses"
+             units="messages"
+             symbol_name="L3Misses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/TAG"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="L3 Bank 00 Accesses"
+             description="The total number of accesses to L3 Bank 00."
+             data_type="uint64"
+             equation="C 0 READ 2 UMUL"
+             underscore_name="l3_bank00_accesses"
+             units="messages"
+             symbol_name="L3Bank00Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="EU FPU0 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 19 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu0_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Hybrid Instruction"
+             description="The percentage of time in which execution units were actively processing hybrid instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 14 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_hybrid_fpu1_instruction"
+             units="percent"
+             symbol_name="EuHybridFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Read Throughput"
+             description="The total number of GPU memory bytes read from GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL"
+             equation="C 6 READ 64 UMUL"
+             underscore_name="gti_read_throughput"
+             units="bytes"
+             symbol_name="GtiReadThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI L3 Throughput"
+             description="The total number of GPU memory bytes transferred between L3 caches and GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="C 4 READ C 5 READ UADD 64 UMUL"
+             underscore_name="gti_l3_throughput"
+             units="bytes"
+             symbol_name="GtiL3Throughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Bank 00 IC Accesses"
+             description="The total number of accesses to L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 0 READ B 1 READ UADD 2 UMUL $L3Bank00Accesses UMIN"
+             underscore_name="l3_bank00_ic_accesses"
+             units="messages"
+             symbol_name="L3Bank00IcAccesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="L3 Bank 00 IC Hits"
+             description="The total number of hits in L3 Bank 00 from IC cache."
+             data_type="uint64"
+             equation="B 1 READ 2 UMUL $L3Bank00IcAccesses UMIN"
+             underscore_name="l3_bank00_ic_hits"
+             units="messages"
+             symbol_name="L3Bank00IcHits"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3/IC"
+             />
+    <counter name="Sampler Accesses"
+             description="The total number of messages send to samplers."
+             data_type="uint64"
+             equation="A 28 READ"
+             underscore_name="sampler_accesses"
+             units="messages"
+             symbol_name="SamplerAccesses"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler"
+             />
+    <counter name="L3 Bank 01 Accesses"
+             description="The total number of accesses to L3 Bank 01."
+             data_type="uint64"
+             equation="C 1 READ 2 UMUL"
+             underscore_name="l3_bank01_accesses"
+             units="messages"
+             symbol_name="L3Bank01Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU0 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU0."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu0_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu0Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU FPU1 Move Instruction"
+             description="The percentage of time in which execution units were actively processing move instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 20 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_move_fpu1_instruction"
+             units="percent"
+             symbol_name="EuMoveFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="L3 Bank 02 Accesses"
+             description="The total number of accesses to L3 Bank 02."
+             data_type="uint64"
+             equation="B 2 READ 2 UMUL"
+             underscore_name="l3_bank02_accesses"
+             units="messages"
+             symbol_name="L3Bank02Accesses"
+             availability="$SliceMask 0x01 AND"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_hw_unit_type="slice"
+             mdapi_group="L3"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="L3 Total Throughput"
+             description="The total number of GPU memory bytes transferred via L3."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSlicesTotalCount UMUL"
+             equation="$L3Accesses 64 UMUL"
+             underscore_name="l3_total_throughput"
+             units="bytes"
+             symbol_name="L3TotalThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GTI Write Throughput"
+             description="The total number of GPU memory bytes written to GTI."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 32 UMUL"
+             equation="C 7 READ 64 UMUL"
+             underscore_name="gti_write_throughput"
+             units="bytes"
+             symbol_name="GtiWriteThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="EU FPU1 Binary Instruction"
+             description="The percentage of time in which execution units were actively processing binary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_binary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuBinaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU FPU1 Ternary Instruction"
+             description="The percentage of time in which execution units were actively processing ternary instructions on FPU1."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_ternary_fpu1_instruction"
+             units="percent"
+             symbol_name="EuTernaryFpu1Instruction"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes/Instructions"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_send_active"
+             units="percent"
+             symbol_name="EuSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x166C0760" />
+        <register type="NOA" address="0x00009888" value="0x1593001E" />
+        <register type="NOA" address="0x00009888" value="0x3F900003" />
+        <register type="NOA" address="0x00009888" value="0x004E8000" />
+        <register type="NOA" address="0x00009888" value="0x0E4E8000" />
+        <register type="NOA" address="0x00009888" value="0x184E8000" />
+        <register type="NOA" address="0x00009888" value="0x1A4E8020" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x006C0051" />
+        <register type="NOA" address="0x00009888" value="0x066C5000" />
+        <register type="NOA" address="0x00009888" value="0x086C5C5D" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5E5F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x186C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x001B4000" />
+        <register type="NOA" address="0x00009888" value="0x061B8000" />
+        <register type="NOA" address="0x00009888" value="0x081BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x101C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1CE000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C0030" />
+        <register type="NOA" address="0x00009888" value="0x004C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C2A00" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0280" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F1500" />
+        <register type="NOA" address="0x00009888" value="0x100F0140" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162C0A00" />
+        <register type="NOA" address="0x00009888" value="0x182C00A0" />
+        <register type="NOA" address="0x00009888" value="0x03933300" />
+        <register type="NOA" address="0x00009888" value="0x05930032" />
+        <register type="NOA" address="0x00009888" value="0x11930000" />
+        <register type="NOA" address="0x00009888" value="0x1B930000" />
+        <register type="NOA" address="0x00009888" value="0x1D900157" />
+        <register type="NOA" address="0x00009888" value="0x1F900158" />
+        <register type="NOA" address="0x00009888" value="0x35900000" />
+        <register type="NOA" address="0x00009888" value="0x19908000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1190030F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900021" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900000" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x53905555" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x0007FFFA" />
+        <register type="OA" address="0x00002774" value="0x0000FEFE" />
+        <register type="OA" address="0x00002778" value="0x0007FFFA" />
+        <register type="OA" address="0x0000277C" value="0x0000FEFD" />
+        <register type="OA" address="0x00002790" value="0x0007FFFA" />
+        <register type="OA" address="0x00002794" value="0x0000FBEF" />
+        <register type="OA" address="0x00002798" value="0x0007FFFA" />
+        <register type="OA" address="0x0000279C" value="0x0000FBDF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00000003" />
+        <register type="FLEX" address="0x0000E658" value="0x00002001" />
+        <register type="FLEX" address="0x0000E758" value="0x00101100" />
+        <register type="FLEX" address="0x0000E45C" value="0x00201200" />
+        <register type="FLEX" address="0x0000E55C" value="0x00301300" />
+        <register type="FLEX" address="0x0000E65C" value="0x00401400" />
+    </register_config>
+  </set>
+
+  <set name="Metric set HDCAndSF"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="hdc_and_sf"
+       hw_config_guid="75f56991-b149-4122-ade9-d9c0c80c733b"
+       chipset="SKLGT4"
+       symbol_name="HDCAndSF"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Polygon Data Ready"
+             description="The percentage of time in which geometry pipeline output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="poly_data_ready"
+             units="percent"
+             symbol_name="PolyDataReady"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe/Strip-Fans"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="HDC stalled by L3 (s0.ss1)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss1)"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ C 4 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader01_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader01AccessStalledOnL3"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss2)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss2)"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ C 2 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader02_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader02AccessStalledOnL3"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="HDC stalled by L3 (s0.ss0)"
+             description="Percentage of time when HDC has messges to L3, but it's stalled due to lack of credits (s0.ss0)"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ C 6 READ USUB 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_sampler_shader00_access_stalled_on_l3"
+             units="percent"
+             symbol_name="NonSamplerShader00AccessStalledOnL3"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="GPU/Data Port"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x104F0232" />
+        <register type="NOA" address="0x00009888" value="0x124F4640" />
+        <register type="NOA" address="0x00009888" value="0x106C0232" />
+        <register type="NOA" address="0x00009888" value="0x11834400" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x004F1880" />
+        <register type="NOA" address="0x00009888" value="0x024F08BB" />
+        <register type="NOA" address="0x00009888" value="0x044F001B" />
+        <register type="NOA" address="0x00009888" value="0x046C0100" />
+        <register type="NOA" address="0x00009888" value="0x066C000B" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x041B8000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x005B8000" />
+        <register type="NOA" address="0x00009888" value="0x025BC000" />
+        <register type="NOA" address="0x00009888" value="0x045B4000" />
+        <register type="NOA" address="0x00009888" value="0x125C8000" />
+        <register type="NOA" address="0x00009888" value="0x145C8000" />
+        <register type="NOA" address="0x00009888" value="0x165C8000" />
+        <register type="NOA" address="0x00009888" value="0x185C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00A0" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x022CC000" />
+        <register type="NOA" address="0x00009888" value="0x042CC000" />
+        <register type="NOA" address="0x00009888" value="0x062CC000" />
+        <register type="NOA" address="0x00009888" value="0x082CC000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0F828000" />
+        <register type="NOA" address="0x00009888" value="0x0F8305C0" />
+        <register type="NOA" address="0x00009888" value="0x09830000" />
+        <register type="NOA" address="0x00009888" value="0x07830000" />
+        <register type="NOA" address="0x00009888" value="0x1D950080" />
+        <register type="NOA" address="0x00009888" value="0x13928000" />
+        <register type="NOA" address="0x00009888" value="0x0F988000" />
+        <register type="NOA" address="0x00009888" value="0x31904000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x59900001" />
+        <register type="NOA" address="0x00009888" value="0x4B900040" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000FDFF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_1"
+       hw_config_guid="0d4cda70-da83-466f-b61e-7a064fe6a232"
+       chipset="SKLGT4"
+       symbol_name="L3_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank1 Active"
+             description="The percentage of time in which slice0 L3 bank1 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_active"
+             units="percent"
+             symbol_name="L30Bank1Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 L3 Bank1 Stalled"
+             description="The percentage of time in which slice0 L3 bank1 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank1_stalled"
+             units="percent"
+             symbol_name="L30Bank1Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Active"
+             description="The percentage of time in which slice0 L3 bank0 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_active"
+             units="percent"
+             symbol_name="L30Bank0Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank0 Stalled"
+             description="The percentage of time in which slice0 L3 bank0 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank0_stalled"
+             units="percent"
+             symbol_name="L30Bank0Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C7B40" />
+        <register type="NOA" address="0x00009888" value="0x166C0020" />
+        <register type="NOA" address="0x00009888" value="0x0A603444" />
+        <register type="NOA" address="0x00009888" value="0x0A613400" />
+        <register type="NOA" address="0x00009888" value="0x1A4EA800" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0002" />
+        <register type="NOA" address="0x00009888" value="0x024E8000" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x0C6C5327" />
+        <register type="NOA" address="0x00009888" value="0x0E6C5425" />
+        <register type="NOA" address="0x00009888" value="0x006C2A00" />
+        <register type="NOA" address="0x00009888" value="0x026C285B" />
+        <register type="NOA" address="0x00009888" value="0x046C005C" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1C6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1E6C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0800" />
+        <register type="NOA" address="0x00009888" value="0x0C1BC000" />
+        <register type="NOA" address="0x00009888" value="0x0E1BC000" />
+        <register type="NOA" address="0x00009888" value="0x001B8000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x1C1C003C" />
+        <register type="NOA" address="0x00009888" value="0x121C8000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x10600000" />
+        <register type="NOA" address="0x00009888" value="0x04600000" />
+        <register type="NOA" address="0x00009888" value="0x0C610044" />
+        <register type="NOA" address="0x00009888" value="0x10610000" />
+        <register type="NOA" address="0x00009888" value="0x06610000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02A8" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0154" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x182C00AA" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190FFC0" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900420" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900021" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900400" />
+        <register type="NOA" address="0x00009888" value="0x43900421" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00014002" />
+        <register type="OA" address="0x0000277C" value="0x0000C3FF" />
+        <register type="OA" address="0x00002780" value="0x00010002" />
+        <register type="OA" address="0x00002784" value="0x0000C7FF" />
+        <register type="OA" address="0x00002788" value="0x00004002" />
+        <register type="OA" address="0x0000278C" value="0x0000D3FF" />
+        <register type="OA" address="0x00002790" value="0x00100700" />
+        <register type="OA" address="0x00002794" value="0x0000FF1F" />
+        <register type="OA" address="0x00002798" value="0x00001402" />
+        <register type="OA" address="0x0000279C" value="0x0000FC3F" />
+        <register type="OA" address="0x000027A0" value="0x00001002" />
+        <register type="OA" address="0x000027A4" value="0x0000FC7F" />
+        <register type="OA" address="0x000027A8" value="0x00000402" />
+        <register type="OA" address="0x000027AC" value="0x0000FD3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_2"
+       hw_config_guid="20137ace-b110-4341-883f-1094c820093c"
+       chipset="SKLGT4"
+       symbol_name="L3_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Stalled"
+             description="The percentage of time in which slice0 L3 bank2 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_stalled"
+             units="percent"
+             symbol_name="L30Bank2Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank2 Active"
+             description="The percentage of time in which slice0 L3 bank2 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank2_active"
+             units="percent"
+             symbol_name="L30Bank2Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C02E0" />
+        <register type="NOA" address="0x00009888" value="0x146C0001" />
+        <register type="NOA" address="0x00009888" value="0x0A623400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x064F4000" />
+        <register type="NOA" address="0x00009888" value="0x026C3324" />
+        <register type="NOA" address="0x00009888" value="0x046C3422" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C0000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C0800" />
+        <register type="NOA" address="0x00009888" value="0x065B4000" />
+        <register type="NOA" address="0x00009888" value="0x1A5C1000" />
+        <register type="NOA" address="0x00009888" value="0x06614000" />
+        <register type="NOA" address="0x00009888" value="0x0C620044" />
+        <register type="NOA" address="0x00009888" value="0x10620000" />
+        <register type="NOA" address="0x00009888" value="0x06620000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C002A" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2CC000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set L3_3"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="l3_3"
+       hw_config_guid="d3a6b05e-46ef-44a8-96c3-9bd3e58acbe6"
+       chipset="SKLGT4"
+       symbol_name="L3_3"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 L3 Bank3 Stalled"
+             description="The percentage of time in which slice0 L3 bank3 is stalled"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_stalled"
+             units="percent"
+             symbol_name="L30Bank3Stalled"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 L3 Bank3 Active"
+             description="The percentage of time in which slice0 L3 bank3 is active"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="l30_bank3_active"
+             units="percent"
+             symbol_name="L30Bank3Active"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GTI/L3"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x126C4E80" />
+        <register type="NOA" address="0x00009888" value="0x146C0000" />
+        <register type="NOA" address="0x00009888" value="0x0A633400" />
+        <register type="NOA" address="0x00009888" value="0x044E8000" />
+        <register type="NOA" address="0x00009888" value="0x064E8000" />
+        <register type="NOA" address="0x00009888" value="0x084E8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4E8000" />
+        <register type="NOA" address="0x00009888" value="0x0C4E8000" />
+        <register type="NOA" address="0x00009888" value="0x026C3321" />
+        <register type="NOA" address="0x00009888" value="0x046C342F" />
+        <register type="NOA" address="0x00009888" value="0x106C0000" />
+        <register type="NOA" address="0x00009888" value="0x1A6C2000" />
+        <register type="NOA" address="0x00009888" value="0x021BC000" />
+        <register type="NOA" address="0x00009888" value="0x041BC000" />
+        <register type="NOA" address="0x00009888" value="0x061B4000" />
+        <register type="NOA" address="0x00009888" value="0x141C8000" />
+        <register type="NOA" address="0x00009888" value="0x161C8000" />
+        <register type="NOA" address="0x00009888" value="0x181C8000" />
+        <register type="NOA" address="0x00009888" value="0x1A1C1800" />
+        <register type="NOA" address="0x00009888" value="0x06604000" />
+        <register type="NOA" address="0x00009888" value="0x0C630044" />
+        <register type="NOA" address="0x00009888" value="0x10630000" />
+        <register type="NOA" address="0x00009888" value="0x06630000" />
+        <register type="NOA" address="0x00009888" value="0x084C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C00AA" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F4000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0055" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190F800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900002" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00100070" />
+        <register type="OA" address="0x00002774" value="0x0000FFF1" />
+        <register type="OA" address="0x00002778" value="0x00028002" />
+        <register type="OA" address="0x0000277C" value="0x000087FF" />
+        <register type="OA" address="0x00002780" value="0x00020002" />
+        <register type="OA" address="0x00002784" value="0x00008FFF" />
+        <register type="OA" address="0x00002788" value="0x00008002" />
+        <register type="OA" address="0x0000278C" value="0x0000A7FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set RasterizerAndPixelBackend"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="rasterizer_and_pixel_backend"
+       hw_config_guid="4081b948-63f1-4b1a-abaa-6017cb77a63b"
+       chipset="SKLGT4"
+       symbol_name="RasterizerAndPixelBackend"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Slice0 Pixel Values Ready"
+             description="The percentage of time in which slice0 pixel values are ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_values0_ready"
+             units="percent"
+             symbol_name="PixelValues0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="Slice0 Rasterizer Input Available"
+             description="The percentage of time in which slice0 rasterizer input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_input_available"
+             units="percent"
+             symbol_name="Rasterizer0InputAvailable"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Slice0 Post-EarlyZ Pixel Data Ready"
+             description="The percentage of time in which slice0 post-EarlyZ pixel data is ready (after early Z tests have been applied)"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="pixel_data0_ready"
+             units="percent"
+             symbol_name="PixelData0Ready"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer/Early Depth Test"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Rasterizer Output Ready"
+             description="The percentage of time in which slice0 rasterizer output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="rasterizer0_output_ready"
+             units="percent"
+             symbol_name="Rasterizer0OutputReady"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Rasterizer"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Slice0 PS Output Available"
+             description="The percentage of time in which slice0 PS output is available"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_output0_available"
+             units="percent"
+             symbol_name="PSOutput0Available"
+             availability="$SliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/3D Pipe"
+             mdapi_hw_unit_type="slice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x102F3800" />
+        <register type="NOA" address="0x00009888" value="0x144D0500" />
+        <register type="NOA" address="0x00009888" value="0x120D03C0" />
+        <register type="NOA" address="0x00009888" value="0x140D03CF" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0004" />
+        <register type="NOA" address="0x00009888" value="0x0C4E4000" />
+        <register type="NOA" address="0x00009888" value="0x042F0480" />
+        <register type="NOA" address="0x00009888" value="0x082F0000" />
+        <register type="NOA" address="0x00009888" value="0x022F0000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0090" />
+        <register type="NOA" address="0x00009888" value="0x064D0027" />
+        <register type="NOA" address="0x00009888" value="0x004D0000" />
+        <register type="NOA" address="0x00009888" value="0x000D0D40" />
+        <register type="NOA" address="0x00009888" value="0x020D803F" />
+        <register type="NOA" address="0x00009888" value="0x040D8023" />
+        <register type="NOA" address="0x00009888" value="0x100D0000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x020F0010" />
+        <register type="NOA" address="0x00009888" value="0x000F0000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0050" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41901400" />
+        <register type="NOA" address="0x00009888" value="0x43901485" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900001" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x0000EFFF" />
+        <register type="OA" address="0x00002778" value="0x00006000" />
+        <register type="OA" address="0x0000277C" value="0x0000F3FF" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set Sampler"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="sampler"
+       hw_config_guid="eae6bbb1-0e2b-478d-bd9e-f10ded2178f9"
+       chipset="SKLGT4"
+       symbol_name="Sampler"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice2 Input Available"
+             description="The percentage of time in which slice0 subslice2 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_input_available"
+             units="percent"
+             symbol_name="Sampler02InputAvailable"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Slice0 Subslice0 Input Available"
+             description="The percentage of time in which slice0 subslice0 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_input_available"
+             units="percent"
+             symbol_name="Sampler00InputAvailable"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="Slice0 Subslice2 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice2 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler02_output_ready"
+             units="percent"
+             symbol_name="Sampler02OutputReady"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Slice0 Subslice1 Input Available"
+             description="The percentage of time in which slice0 subslice1 sampler input is available"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_input_available"
+             units="percent"
+             symbol_name="Sampler01InputAvailable"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Slice0 Subslice0 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice0 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler00_output_ready"
+             units="percent"
+             symbol_name="Sampler00OutputReady"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Slice0 Subslice1 Sampler Output Ready"
+             description="The percentage of time in which slice0 subslice1 sampler output is ready"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="sampler01_output_ready"
+             units="percent"
+             symbol_name="Sampler01OutputReady"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Sampler"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x14152C00" />
+        <register type="NOA" address="0x00009888" value="0x16150005" />
+        <register type="NOA" address="0x00009888" value="0x121600A0" />
+        <register type="NOA" address="0x00009888" value="0x14352C00" />
+        <register type="NOA" address="0x00009888" value="0x16350005" />
+        <register type="NOA" address="0x00009888" value="0x123600A0" />
+        <register type="NOA" address="0x00009888" value="0x14552C00" />
+        <register type="NOA" address="0x00009888" value="0x16550005" />
+        <register type="NOA" address="0x00009888" value="0x125600A0" />
+        <register type="NOA" address="0x00009888" value="0x062F6000" />
+        <register type="NOA" address="0x00009888" value="0x022F2000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C0050" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0010" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0350" />
+        <register type="NOA" address="0x00009888" value="0x0C0FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F00DA" />
+        <register type="NOA" address="0x00009888" value="0x182C0028" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x022DC000" />
+        <register type="NOA" address="0x00009888" value="0x042D4000" />
+        <register type="NOA" address="0x00009888" value="0x0C138000" />
+        <register type="NOA" address="0x00009888" value="0x0E132000" />
+        <register type="NOA" address="0x00009888" value="0x0413C000" />
+        <register type="NOA" address="0x00009888" value="0x1C140018" />
+        <register type="NOA" address="0x00009888" value="0x0C157000" />
+        <register type="NOA" address="0x00009888" value="0x0E150078" />
+        <register type="NOA" address="0x00009888" value="0x10150000" />
+        <register type="NOA" address="0x00009888" value="0x04162180" />
+        <register type="NOA" address="0x00009888" value="0x02160000" />
+        <register type="NOA" address="0x00009888" value="0x04174000" />
+        <register type="NOA" address="0x00009888" value="0x0233A000" />
+        <register type="NOA" address="0x00009888" value="0x04333000" />
+        <register type="NOA" address="0x00009888" value="0x14348000" />
+        <register type="NOA" address="0x00009888" value="0x16348000" />
+        <register type="NOA" address="0x00009888" value="0x02357870" />
+        <register type="NOA" address="0x00009888" value="0x10350000" />
+        <register type="NOA" address="0x00009888" value="0x04360043" />
+        <register type="NOA" address="0x00009888" value="0x02360000" />
+        <register type="NOA" address="0x00009888" value="0x04371000" />
+        <register type="NOA" address="0x00009888" value="0x0E538000" />
+        <register type="NOA" address="0x00009888" value="0x00538000" />
+        <register type="NOA" address="0x00009888" value="0x06533000" />
+        <register type="NOA" address="0x00009888" value="0x1C540020" />
+        <register type="NOA" address="0x00009888" value="0x12548000" />
+        <register type="NOA" address="0x00009888" value="0x0E557000" />
+        <register type="NOA" address="0x00009888" value="0x00557800" />
+        <register type="NOA" address="0x00009888" value="0x10550000" />
+        <register type="NOA" address="0x00009888" value="0x06560043" />
+        <register type="NOA" address="0x00009888" value="0x02560000" />
+        <register type="NOA" address="0x00009888" value="0x06571000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900060" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900842" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900060" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x70800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0000C000" />
+        <register type="OA" address="0x00002774" value="0x0000E7FF" />
+        <register type="OA" address="0x00002778" value="0x00003000" />
+        <register type="OA" address="0x0000277C" value="0x0000F9FF" />
+        <register type="OA" address="0x00002780" value="0x00000C00" />
+        <register type="OA" address="0x00002784" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_1"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_1"
+       hw_config_guid="1bba4bd2-81d4-45ec-847f-bc363e17e14d"
+       chipset="SKLGT4"
+       symbol_name="TDL_1"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice0"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice0 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 1 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread00_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread00ReadyForDispatch"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="PS Thread Ready For Dispatch on Slice0 Subslice2"
+             description="The percentage of time in which PS thread is ready for dispatch on slice0 subslice2 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_thread02_ready_for_dispatch"
+             units="percent"
+             symbol_name="PSThread02ReadyForDispatch"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="NonPS Thread Ready For Dispatch on Slice0 Subslice1"
+             description="The percentage of time in which non-PS thread is ready for dispatch on slice0 subslice1 thread dispatcher"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="non_ps_thread01_ready_for_dispatch"
+             units="percent"
+             symbol_name="NonPSThread01ReadyForDispatch"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12120000" />
+        <register type="NOA" address="0x00009888" value="0x12320000" />
+        <register type="NOA" address="0x00009888" value="0x12520000" />
+        <register type="NOA" address="0x00009888" value="0x002F8000" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0015" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F03A0" />
+        <register type="NOA" address="0x00009888" value="0x0C0FF000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0095" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2D4000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x02108000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x02118000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x02121880" />
+        <register type="NOA" address="0x00009888" value="0x041219B5" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x02134000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x0C308000" />
+        <register type="NOA" address="0x00009888" value="0x0E304000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x0C318000" />
+        <register type="NOA" address="0x00009888" value="0x0E314000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x0C321A80" />
+        <register type="NOA" address="0x00009888" value="0x0E320033" />
+        <register type="NOA" address="0x00009888" value="0x06320031" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x0C334000" />
+        <register type="NOA" address="0x00009888" value="0x0E331000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0E508000" />
+        <register type="NOA" address="0x00009888" value="0x00508000" />
+        <register type="NOA" address="0x00009888" value="0x02504000" />
+        <register type="NOA" address="0x00009888" value="0x0E518000" />
+        <register type="NOA" address="0x00009888" value="0x00518000" />
+        <register type="NOA" address="0x00009888" value="0x02514000" />
+        <register type="NOA" address="0x00009888" value="0x0E521880" />
+        <register type="NOA" address="0x00009888" value="0x00521A80" />
+        <register type="NOA" address="0x00009888" value="0x02520033" />
+        <register type="NOA" address="0x00009888" value="0x0E534000" />
+        <register type="NOA" address="0x00009888" value="0x00534000" />
+        <register type="NOA" address="0x00009888" value="0x02531000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900800" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900062" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900C00" />
+        <register type="NOA" address="0x00009888" value="0x43900003" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00000002" />
+        <register type="OA" address="0x00002774" value="0x00007FFF" />
+        <register type="OA" address="0x00002778" value="0x00000000" />
+        <register type="OA" address="0x0000277C" value="0x00009FFF" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000EFFF" />
+        <register type="OA" address="0x00002788" value="0x00000000" />
+        <register type="OA" address="0x0000278C" value="0x0000F3FF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FDFF" />
+        <register type="OA" address="0x00002798" value="0x00000000" />
+        <register type="OA" address="0x0000279C" value="0x0000FE7F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Metric set TDL_2"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="tdl_2"
+       hw_config_guid="a4b3106c-cfec-49f5-8e26-470470379e66"
+       chipset="SKLGT4"
+       symbol_name="TDL_2"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="SQ is full"
+             description="The percentage of time when SQ is filled above a threshold (usually 48 entries)"
+             data_type="float"
+             max_equation="100"
+             equation="PERFCNT1 READ_REG 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gt_request_queue_full"
+             units="percent"
+             symbol_name="GTRequestQueueFull"
+             availability="true $QueryMode &&"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL4 OCL"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="GTI"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Send Pipe Active"
+             description="The percentage of time in which EU send pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 12 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_send_active"
+             units="percent"
+             symbol_name="VsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 11 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu1_active"
+             units="percent"
+             symbol_name="VsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GS Threads Dispatched"
+             description="The total number of geometry shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 5 READ"
+             underscore_name="gs_threads"
+             units="threads"
+             symbol_name="GsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Geometry Shader"
+             />
+    <counter name="Early Hi-Depth Test Fails"
+             description="The total number of pixels dropped on early hierarchical depth test."
+             data_type="uint64"
+             equation="A 22 READ 4 UMUL"
+             underscore_name="hi_depth_test_fails"
+             units="pixels"
+             symbol_name="HiDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Hi-Depth Test"
+             />
+    <counter name="FS Both FPU Active"
+             description="The percentage of time in which fragment shaders were processed actively on the both FPUs."
+             data_type="float"
+             max_equation="100"
+             equation="A 18 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_eu_both_fpu_active"
+             units="percent"
+             symbol_name="PsEuBothFpuActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Frame Batch Draw"
+             mdapi_group="3D Pipe/Fragment Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS Threads Dispatched"
+             description="The total number of vertex shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 1 READ"
+             underscore_name="vs_threads"
+             units="threads"
+             symbol_name="VsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Vertex Shader"
+             />
+    <counter name="FS Threads Dispatched"
+             description="The total number of fragment shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 6 READ"
+             underscore_name="ps_threads"
+             units="threads"
+             symbol_name="PsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Fragment Shader"
+             />
+    <counter name="Shader Barrier Messages"
+             description="The total number of shader barrier messages."
+             data_type="uint64"
+             equation="A 35 READ"
+             underscore_name="shader_barriers"
+             units="messages"
+             symbol_name="ShaderBarriers"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Barrier"
+             />
+    <counter name="Sampler Texels"
+             description="The total number of texels seen on input (with 2x2 accuracy) in all sampler units."
+             data_type="uint64"
+             equation="A 28 READ 4 UMUL"
+             underscore_name="sampler_texels"
+             units="texels"
+             symbol_name="SamplerTexels"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Input"
+             />
+    <counter name="Pixels Failing Tests"
+             description="The total number of pixels dropped on post-FS alpha, stencil, or depth tests."
+             data_type="uint64"
+             equation="A 25 READ 4 UMUL"
+             underscore_name="pixels_failing_post_ps_tests"
+             units="pixels"
+             symbol_name="PixelsFailingPostPsTests"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort0"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice1 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice1 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 2 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header01_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader01ReadyPort1"
+             availability="$SubsliceMask 0x2 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Sampler Texels Misses"
+             description="The total number of texels lookups (with 2x2 accuracy) that missed L1 sampler cache."
+             data_type="uint64"
+             equation="A 29 READ 4 UMUL"
+             underscore_name="sampler_texel_misses"
+             units="texels"
+             symbol_name="SamplerTexelMisses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Batch Frame Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="Sampler/Sampler Cache"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="SLM Bytes Read"
+             description="The total number of GPU memory bytes read from shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ 64 UMUL"
+             underscore_name="slm_bytes_read"
+             units="bytes"
+             symbol_name="SlmBytesRead"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 16 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu1_active"
+             units="percent"
+             symbol_name="PsFpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="PS Send Pipeline Active"
+             description="The percentage of time in which EU send pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 17 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_send_active"
+             units="percent"
+             symbol_name="PsSendActive"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a vertex shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 10 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vs_fpu0_active"
+             units="percent"
+             symbol_name="VsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Vertex Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort1"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice2 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice2 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header02_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader02ReadyPort0"
+             availability="$SubsliceMask 0x4 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Rasterized Pixels"
+             description="The total number of rasterized pixels."
+             data_type="uint64"
+             equation="A 21 READ 4 UMUL"
+             underscore_name="rasterized_pixels"
+             units="pixels"
+             symbol_name="RasterizedPixels"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer"
+             />
+    <counter name="PS FPU0 Pipe Active"
+             description="The percentage of time in which EU FPU0 pipeline was actively processing a pixel shader instruction."
+             data_type="float"
+             max_equation="100"
+             equation="A 15 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="ps_fpu0_active"
+             units="percent"
+             symbol_name="PsFpu0Active"
+             semantic_type="duration"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pixel Shader"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="DS Threads Dispatched"
+             description="The total number of domain shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 3 READ"
+             underscore_name="ds_threads"
+             units="threads"
+             symbol_name="DsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Domain Shader"
+             />
+    <counter name="Samples Written"
+             description="The total number of samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 26 READ 4 UMUL"
+             underscore_name="samples_written"
+             units="pixels"
+             symbol_name="SamplesWritten"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Blended"
+             description="The total number of blended samples or pixels written to all render targets."
+             data_type="uint64"
+             equation="A 27 READ 4 UMUL"
+             underscore_name="samples_blended"
+             units="pixels"
+             symbol_name="SamplesBlended"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Output Merger"
+             />
+    <counter name="Early Depth Test Fails"
+             description="The total number of pixels dropped on early depth test."
+             data_type="uint64"
+             equation="A 23 READ 4 UMUL"
+             underscore_name="early_depth_test_fails"
+             units="pixels"
+             symbol_name="EarlyDepthTestFails"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Rasterizer/Early Depth Test"
+             />
+    <counter name="Shader Memory Accesses"
+             description="The total number of shader memory accesses to L3."
+             data_type="uint64"
+             equation="A 32 READ"
+             underscore_name="shader_memory_accesses"
+             units="messages"
+             symbol_name="ShaderMemoryAccesses"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port"
+             />
+    <counter name="HS Threads Dispatched"
+             description="The total number of hull shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 2 READ"
+             underscore_name="hs_threads"
+             units="threads"
+             symbol_name="HsThreads"
+             semantic_type="event"
+             mdapi_supported_apis="OGL4 IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Hull Shader"
+             />
+    <counter name="SLM Bytes Written"
+             description="The total number of GPU memory bytes written into shared local memory."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 31 READ 64 UMUL"
+             underscore_name="slm_bytes_written"
+             units="bytes"
+             symbol_name="SlmBytesWritten"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_group="L3/Data Port/SLM"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="L3 Shader Throughput"
+             description="The total number of GPU memory bytes transferred between shaders and L3 caches w/o URB."
+             data_type="uint64"
+             max_equation="$GpuCoreClocks 64 UMUL $EuSubslicesTotalCount UMUL"
+             equation="A 30 READ  A 31 READ $ShaderMemoryAccesses 64 UMUL UADD UADD"
+             underscore_name="l3_shader_throughput"
+             units="bytes"
+             symbol_name="L3ShaderThroughput"
+             semantic_type="throughput"
+             mdapi_supported_apis="OGL4 OCL IO BB"
+             mdapi_usage_flags="Tier2 Frame Batch Draw"
+             mdapi_group="L3/Data Port"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Samples Killed in FS"
+             description="The total number of samples or pixels dropped in fragment shaders."
+             data_type="uint64"
+             equation="A 24 READ 4 UMUL"
+             underscore_name="samples_killed_in_ps"
+             units="pixels"
+             symbol_name="SamplesKilledInPs"
+             semantic_type="event"
+             mdapi_supported_apis="OGL IO BB"
+             mdapi_usage_flags="Tier4 Overview Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="3D Pipe/Fragment Shader"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 0"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 0"
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port0"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort0"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <counter name="Shader Atomic Memory Accesses"
+             description="The total number of shader atomic memory accesses."
+             data_type="uint64"
+             equation="A 34 READ"
+             underscore_name="shader_atomics"
+             units="messages"
+             symbol_name="ShaderAtomics"
+             semantic_type="event"
+             mdapi_supported_apis="OGL OCL IO BB"
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="L3/Data Port/Atomics"
+             />
+    <counter name="Thread Header Ready on Slice0 Subslice0 Port 1"
+             description="The percentage of time in which thread header is ready on slice0 subslice0 thread dispatcher port 1"
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="thread_header00_ready_port1"
+             units="percent"
+             symbol_name="ThreadHeader00ReadyPort1"
+             availability="$SubsliceMask 0x1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview Frame Batch Draw"
+             mdapi_group="GPU/Thread Dispatcher"
+             mdapi_hw_unit_type="subslice"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x000091BC" value="0xE0500000" />
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x12124D60" />
+        <register type="NOA" address="0x00009888" value="0x12322E60" />
+        <register type="NOA" address="0x00009888" value="0x12524D60" />
+        <register type="NOA" address="0x00009888" value="0x022F3000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0014" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x0C0FE000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F0097" />
+        <register type="NOA" address="0x00009888" value="0x082C8000" />
+        <register type="NOA" address="0x00009888" value="0x0A2C8000" />
+        <register type="NOA" address="0x00009888" value="0x002D8000" />
+        <register type="NOA" address="0x00009888" value="0x062D4000" />
+        <register type="NOA" address="0x00009888" value="0x0410C000" />
+        <register type="NOA" address="0x00009888" value="0x0411C000" />
+        <register type="NOA" address="0x00009888" value="0x04121FB7" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x04135000" />
+        <register type="NOA" address="0x00009888" value="0x00308000" />
+        <register type="NOA" address="0x00009888" value="0x06304000" />
+        <register type="NOA" address="0x00009888" value="0x00318000" />
+        <register type="NOA" address="0x00009888" value="0x06314000" />
+        <register type="NOA" address="0x00009888" value="0x00321B80" />
+        <register type="NOA" address="0x00009888" value="0x0632003F" />
+        <register type="NOA" address="0x00009888" value="0x00334000" />
+        <register type="NOA" address="0x00009888" value="0x06331000" />
+        <register type="NOA" address="0x00009888" value="0x0250C000" />
+        <register type="NOA" address="0x00009888" value="0x0251C000" />
+        <register type="NOA" address="0x00009888" value="0x02521FB7" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x02535000" />
+        <register type="NOA" address="0x00009888" value="0x1190FC00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900800" />
+        <register type="NOA" address="0x00009888" value="0x43900063" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x00800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00010003" />
+        <register type="FLEX" address="0x0000E658" value="0x00012011" />
+        <register type="FLEX" address="0x0000E758" value="0x00015014" />
+        <register type="FLEX" address="0x0000E45C" value="0x00051050" />
+        <register type="FLEX" address="0x0000E55C" value="0x00053052" />
+        <register type="FLEX" address="0x0000E65C" value="0x00055054" />
+    </register_config>
+  </set>
+
+  <set name="Compute Metrics Extra Gen9"
+       mdapi_supported_apis="OGL4 OCL IO BB"
+       underscore_name="compute_extra"
+       hw_config_guid="a5aa857d-e8f0-4dfa-8981-ce340fa748fd"
+       chipset="SKLGT4"
+       symbol_name="ComputeExtra"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU FPU1 Pipe Active"
+             description="The percentage of time in which EU FPU1 pipeline was actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="fpu1_active"
+             units="percent"
+             symbol_name="Fpu1Active"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x121203E0" />
+        <register type="NOA" address="0x00009888" value="0x123203E0" />
+        <register type="NOA" address="0x00009888" value="0x125203E0" />
+        <register type="NOA" address="0x00009888" value="0x129203E0" />
+        <register type="NOA" address="0x00009888" value="0x12B203E0" />
+        <register type="NOA" address="0x00009888" value="0x12D203E0" />
+        <register type="NOA" address="0x00009888" value="0x131203E0" />
+        <register type="NOA" address="0x00009888" value="0x133203E0" />
+        <register type="NOA" address="0x00009888" value="0x135203E0" />
+        <register type="NOA" address="0x00009888" value="0x1A4EF000" />
+        <register type="NOA" address="0x00009888" value="0x1C4E0003" />
+        <register type="NOA" address="0x00009888" value="0x024EC000" />
+        <register type="NOA" address="0x00009888" value="0x044EC000" />
+        <register type="NOA" address="0x00009888" value="0x064EC000" />
+        <register type="NOA" address="0x00009888" value="0x022F4000" />
+        <register type="NOA" address="0x00009888" value="0x0C4C02A0" />
+        <register type="NOA" address="0x00009888" value="0x084CA000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C0042" />
+        <register type="NOA" address="0x00009888" value="0x0C0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E0DA000" />
+        <register type="NOA" address="0x00009888" value="0x000D8000" />
+        <register type="NOA" address="0x00009888" value="0x020DA000" />
+        <register type="NOA" address="0x00009888" value="0x040DA000" />
+        <register type="NOA" address="0x00009888" value="0x060D2000" />
+        <register type="NOA" address="0x00009888" value="0x100F0150" />
+        <register type="NOA" address="0x00009888" value="0x0C0F5000" />
+        <register type="NOA" address="0x00009888" value="0x0E0F006D" />
+        <register type="NOA" address="0x00009888" value="0x182C00A8" />
+        <register type="NOA" address="0x00009888" value="0x022C8000" />
+        <register type="NOA" address="0x00009888" value="0x042C8000" />
+        <register type="NOA" address="0x00009888" value="0x062C8000" />
+        <register type="NOA" address="0x00009888" value="0x0C2C8000" />
+        <register type="NOA" address="0x00009888" value="0x042D8000" />
+        <register type="NOA" address="0x00009888" value="0x06104000" />
+        <register type="NOA" address="0x00009888" value="0x06114000" />
+        <register type="NOA" address="0x00009888" value="0x06120033" />
+        <register type="NOA" address="0x00009888" value="0x00120000" />
+        <register type="NOA" address="0x00009888" value="0x06131000" />
+        <register type="NOA" address="0x00009888" value="0x04308000" />
+        <register type="NOA" address="0x00009888" value="0x04318000" />
+        <register type="NOA" address="0x00009888" value="0x04321980" />
+        <register type="NOA" address="0x00009888" value="0x00320000" />
+        <register type="NOA" address="0x00009888" value="0x04334000" />
+        <register type="NOA" address="0x00009888" value="0x04504000" />
+        <register type="NOA" address="0x00009888" value="0x04514000" />
+        <register type="NOA" address="0x00009888" value="0x04520033" />
+        <register type="NOA" address="0x00009888" value="0x00520000" />
+        <register type="NOA" address="0x00009888" value="0x04531000" />
+        <register type="NOA" address="0x00009888" value="0x1ACEF000" />
+        <register type="NOA" address="0x00009888" value="0x1CCE0003" />
+        <register type="NOA" address="0x00009888" value="0x00AF8000" />
+        <register type="NOA" address="0x00009888" value="0x0CCC02A0" />
+        <register type="NOA" address="0x00009888" value="0x0ACC0001" />
+        <register type="NOA" address="0x00009888" value="0x0C8D8000" />
+        <register type="NOA" address="0x00009888" value="0x0E8DA000" />
+        <register type="NOA" address="0x00009888" value="0x008D8000" />
+        <register type="NOA" address="0x00009888" value="0x028DA000" />
+        <register type="NOA" address="0x00009888" value="0x108F0150" />
+        <register type="NOA" address="0x00009888" value="0x0C8FB000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F0001" />
+        <register type="NOA" address="0x00009888" value="0x18AC00A8" />
+        <register type="NOA" address="0x00009888" value="0x06AC8000" />
+        <register type="NOA" address="0x00009888" value="0x02AD4000" />
+        <register type="NOA" address="0x00009888" value="0x02908000" />
+        <register type="NOA" address="0x00009888" value="0x02918000" />
+        <register type="NOA" address="0x00009888" value="0x02921980" />
+        <register type="NOA" address="0x00009888" value="0x00920000" />
+        <register type="NOA" address="0x00009888" value="0x02934000" />
+        <register type="NOA" address="0x00009888" value="0x02B04000" />
+        <register type="NOA" address="0x00009888" value="0x02B14000" />
+        <register type="NOA" address="0x00009888" value="0x02B20033" />
+        <register type="NOA" address="0x00009888" value="0x00B20000" />
+        <register type="NOA" address="0x00009888" value="0x02B31000" />
+        <register type="NOA" address="0x00009888" value="0x00D08000" />
+        <register type="NOA" address="0x00009888" value="0x00D18000" />
+        <register type="NOA" address="0x00009888" value="0x00D21980" />
+        <register type="NOA" address="0x00009888" value="0x00D34000" />
+        <register type="NOA" address="0x00009888" value="0x072F8000" />
+        <register type="NOA" address="0x00009888" value="0x0D4C0100" />
+        <register type="NOA" address="0x00009888" value="0x0D0D8000" />
+        <register type="NOA" address="0x00009888" value="0x0F0DA000" />
+        <register type="NOA" address="0x00009888" value="0x110F01B0" />
+        <register type="NOA" address="0x00009888" value="0x192C0080" />
+        <register type="NOA" address="0x00009888" value="0x0F2D4000" />
+        <register type="NOA" address="0x00009888" value="0x0F108000" />
+        <register type="NOA" address="0x00009888" value="0x0F118000" />
+        <register type="NOA" address="0x00009888" value="0x0F121980" />
+        <register type="NOA" address="0x00009888" value="0x01120000" />
+        <register type="NOA" address="0x00009888" value="0x0F134000" />
+        <register type="NOA" address="0x00009888" value="0x0F304000" />
+        <register type="NOA" address="0x00009888" value="0x0F314000" />
+        <register type="NOA" address="0x00009888" value="0x0F320033" />
+        <register type="NOA" address="0x00009888" value="0x01320000" />
+        <register type="NOA" address="0x00009888" value="0x0F331000" />
+        <register type="NOA" address="0x00009888" value="0x0D508000" />
+        <register type="NOA" address="0x00009888" value="0x0D518000" />
+        <register type="NOA" address="0x00009888" value="0x0D521980" />
+        <register type="NOA" address="0x00009888" value="0x01520000" />
+        <register type="NOA" address="0x00009888" value="0x0D534000" />
+        <register type="NOA" address="0x00009888" value="0x1190FF80" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900C00" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+        <register type="NOA" address="0x00009888" value="0x4B900002" />
+        <register type="NOA" address="0x00009888" value="0x59900000" />
+        <register type="NOA" address="0x00009888" value="0x51901100" />
+        <register type="NOA" address="0x00009888" value="0x41901000" />
+        <register type="NOA" address="0x00009888" value="0x43901423" />
+        <register type="NOA" address="0x00009888" value="0x53903331" />
+        <register type="NOA" address="0x00009888" value="0x45900044" />
+    </register_config>
+  </set>
+
+  <set name="Media Vme Pipe Gen9"
+       mdapi_supported_apis="MEDIA IO BB"
+       underscore_name="vme_pipe"
+       hw_config_guid="0e8d8b86-4ee7-4cdd-aaaa-58adc92cb29e"
+       chipset="SKLGT4"
+       symbol_name="VMEPipe"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="EU Active"
+             description="The percentage of time in which the Execution Units were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 7 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_active"
+             units="percent"
+             symbol_name="EuActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Both FPU Pipes Active"
+             description="The percentage of time in which both EU FPU pipelines were actively processing."
+             data_type="float"
+             max_equation="100"
+             equation="A 9 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_fpu_both_active"
+             units="percent"
+             symbol_name="EuFpuBothActive"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Overview System Frame Batch Draw"
+             mdapi_group="EU Array/Pipes"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="CS Threads Dispatched"
+             description="The total number of compute shader hardware threads dispatched."
+             data_type="uint64"
+             equation="A 4 READ"
+             underscore_name="cs_threads"
+             units="threads"
+             symbol_name="CsThreads"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier3 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="EU Array/Compute Shader"
+             />
+    <counter name="EU Thread Occupancy"
+             description="The percentage of time in which hardware threads occupied EUs."
+             data_type="float"
+             max_equation="100"
+             equation="8 A 10 READ FMUL $EuThreadsCount FDIV $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_thread_occupancy"
+             units="percent"
+             symbol_name="EuThreadOccupancy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="EU Stall"
+             description="The percentage of time in which the Execution Units were stalled."
+             data_type="float"
+             max_equation="100"
+             equation="A 8 READ $EuCoresTotalCount UDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="eu_stall"
+             units="percent"
+             symbol_name="EuStall"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier2 Overview System Frame Batch Draw"
+             mdapi_group="EU Array"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="VME Busy"
+             description="The percentage of time in which VME (IME or CRE) was actively processing data."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 3 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vme_busy"
+             units="percent"
+             symbol_name="VMEBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Overview System Batch Tier2"
+             mdapi_group="VME Pipe"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Busy"
+             description="The percentage of time in which the GPU has been processing GPU commands."
+             data_type="float"
+             max_equation="100"
+             equation="A 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="gpu_busy"
+             units="percent"
+             symbol_name="GpuBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x141A5800" />
+        <register type="NOA" address="0x00009888" value="0x161A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12180240" />
+        <register type="NOA" address="0x00009888" value="0x14180002" />
+        <register type="NOA" address="0x00009888" value="0x149A5800" />
+        <register type="NOA" address="0x00009888" value="0x169A00C0" />
+        <register type="NOA" address="0x00009888" value="0x12980240" />
+        <register type="NOA" address="0x00009888" value="0x14980002" />
+        <register type="NOA" address="0x00009888" value="0x1A4E3FC0" />
+        <register type="NOA" address="0x00009888" value="0x002F1000" />
+        <register type="NOA" address="0x00009888" value="0x022F8000" />
+        <register type="NOA" address="0x00009888" value="0x042F3000" />
+        <register type="NOA" address="0x00009888" value="0x004C4000" />
+        <register type="NOA" address="0x00009888" value="0x0A4C9500" />
+        <register type="NOA" address="0x00009888" value="0x0C4C002A" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0400" />
+        <register type="NOA" address="0x00009888" value="0x0E0F5500" />
+        <register type="NOA" address="0x00009888" value="0x100F0015" />
+        <register type="NOA" address="0x00009888" value="0x002C8000" />
+        <register type="NOA" address="0x00009888" value="0x0E2C8000" />
+        <register type="NOA" address="0x00009888" value="0x162CAA00" />
+        <register type="NOA" address="0x00009888" value="0x182C000A" />
+        <register type="NOA" address="0x00009888" value="0x04193000" />
+        <register type="NOA" address="0x00009888" value="0x081A28C1" />
+        <register type="NOA" address="0x00009888" value="0x001A0000" />
+        <register type="NOA" address="0x00009888" value="0x00133000" />
+        <register type="NOA" address="0x00009888" value="0x0613C000" />
+        <register type="NOA" address="0x00009888" value="0x0813F000" />
+        <register type="NOA" address="0x00009888" value="0x00172000" />
+        <register type="NOA" address="0x00009888" value="0x06178000" />
+        <register type="NOA" address="0x00009888" value="0x0817A000" />
+        <register type="NOA" address="0x00009888" value="0x00180037" />
+        <register type="NOA" address="0x00009888" value="0x06180940" />
+        <register type="NOA" address="0x00009888" value="0x08180000" />
+        <register type="NOA" address="0x00009888" value="0x02180000" />
+        <register type="NOA" address="0x00009888" value="0x04183000" />
+        <register type="NOA" address="0x00009888" value="0x04AFC000" />
+        <register type="NOA" address="0x00009888" value="0x06AF3000" />
+        <register type="NOA" address="0x00009888" value="0x0ACC4000" />
+        <register type="NOA" address="0x00009888" value="0x0CCC0015" />
+        <register type="NOA" address="0x00009888" value="0x0A8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C8DA000" />
+        <register type="NOA" address="0x00009888" value="0x0E8F4000" />
+        <register type="NOA" address="0x00009888" value="0x108F0015" />
+        <register type="NOA" address="0x00009888" value="0x16ACA000" />
+        <register type="NOA" address="0x00009888" value="0x18AC000A" />
+        <register type="NOA" address="0x00009888" value="0x06993000" />
+        <register type="NOA" address="0x00009888" value="0x0C9A28C1" />
+        <register type="NOA" address="0x00009888" value="0x009A0000" />
+        <register type="NOA" address="0x00009888" value="0x0A93F000" />
+        <register type="NOA" address="0x00009888" value="0x0C93F000" />
+        <register type="NOA" address="0x00009888" value="0x0A97A000" />
+        <register type="NOA" address="0x00009888" value="0x0C97A000" />
+        <register type="NOA" address="0x00009888" value="0x0A980977" />
+        <register type="NOA" address="0x00009888" value="0x08980000" />
+        <register type="NOA" address="0x00009888" value="0x04980000" />
+        <register type="NOA" address="0x00009888" value="0x06983000" />
+        <register type="NOA" address="0x00009888" value="0x119000FF" />
+        <register type="NOA" address="0x00009888" value="0x51900010" />
+        <register type="NOA" address="0x00009888" value="0x41900060" />
+        <register type="NOA" address="0x00009888" value="0x55900111" />
+        <register type="NOA" address="0x00009888" value="0x45900C00" />
+        <register type="NOA" address="0x00009888" value="0x47900821" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900002" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x30800000" />
+        <register type="OA" address="0x00002770" value="0x00100030" />
+        <register type="OA" address="0x00002774" value="0x0000FFF9" />
+        <register type="OA" address="0x00002778" value="0x00000002" />
+        <register type="OA" address="0x0000277C" value="0x0000FFFC" />
+        <register type="OA" address="0x00002780" value="0x00000002" />
+        <register type="OA" address="0x00002784" value="0x0000FFF3" />
+        <register type="OA" address="0x00002788" value="0x00100180" />
+        <register type="OA" address="0x0000278C" value="0x0000FFCF" />
+        <register type="OA" address="0x00002790" value="0x00000002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00000002" />
+        <register type="OA" address="0x0000279C" value="0x0000FF3F" />
+    </register_config>
+    <register_config type="FLEX">
+        <register type="FLEX" address="0x0000E458" value="0x00005004" />
+        <register type="FLEX" address="0x0000E558" value="0x00008003" />
+    </register_config>
+  </set>
+
+  <set name="Gpu Rings Busyness"
+       mdapi_supported_apis="OGL OCL MEDIA IO BB"
+       underscore_name="gpu_busyness"
+       hw_config_guid="4e5b1599-5b01-4b3d-89fa-6b26a25fe02b"
+       chipset="SKLGT4"
+       symbol_name="GpuBusyness"
+       >
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="Vebox Ring Busy"
+             description="The percentage of time when vebox command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 4 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vebox_busy"
+             units="percent"
+             symbol_name="VeboxBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Render Ring Busy"
+             description="The percentage of time when render command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 7 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="render_busy"
+             units="percent"
+             symbol_name="RenderBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox0 Ring Busy"
+             description="The percentage of time when Vdbox0 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 6 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox0_busy"
+             units="percent"
+             symbol_name="Vdbox0Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Blitter Ring Busy"
+             description="The percentage of time when blitter command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 3 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="blitter_busy"
+             units="percent"
+             symbol_name="BlitterBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AnyRingBusy"
+             description="The percentage of time when any command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="any_ring_busy"
+             units="percent"
+             symbol_name="AnyRingBusy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="Vdbox1 Ring Busy"
+             description="The percentage of time when Vdbox1 command streamer was busy."
+             data_type="float"
+             max_equation="100"
+             equation="C 5 READ 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="vdbox1_busy"
+             units="percent"
+             symbol_name="Vdbox1Busy"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="System Frame Batch"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x21D05800" />
+        <register type="NOA" address="0x00009888" value="0x13805800" />
+        <register type="NOA" address="0x00009888" value="0x05962C25" />
+        <register type="NOA" address="0x00009888" value="0x19950016" />
+        <register type="NOA" address="0x00009888" value="0x21C05800" />
+        <register type="NOA" address="0x00009888" value="0x09D000A5" />
+        <register type="NOA" address="0x00009888" value="0x11D00000" />
+        <register type="NOA" address="0x00009888" value="0x05D00000" />
+        <register type="NOA" address="0x00009888" value="0x09D54000" />
+        <register type="NOA" address="0x00009888" value="0x07800035" />
+        <register type="NOA" address="0x00009888" value="0x11800000" />
+        <register type="NOA" address="0x00009888" value="0x1D810400" />
+        <register type="NOA" address="0x00009888" value="0x21960000" />
+        <register type="NOA" address="0x00009888" value="0x0996C000" />
+        <register type="NOA" address="0x00009888" value="0x0B964000" />
+        <register type="NOA" address="0x00009888" value="0x19938000" />
+        <register type="NOA" address="0x00009888" value="0x1B930068" />
+        <register type="NOA" address="0x00009888" value="0x15948000" />
+        <register type="NOA" address="0x00009888" value="0x1B94000C" />
+        <register type="NOA" address="0x00009888" value="0x03957500" />
+        <register type="NOA" address="0x00009888" value="0x1D950000" />
+        <register type="NOA" address="0x00009888" value="0x17950000" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x07928000" />
+        <register type="NOA" address="0x00009888" value="0x03988000" />
+        <register type="NOA" address="0x00009888" value="0x17908000" />
+        <register type="NOA" address="0x00009888" value="0x19904000" />
+        <register type="NOA" address="0x00009888" value="0x1B908000" />
+        <register type="NOA" address="0x00009888" value="0x1D908000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x09978000" />
+        <register type="NOA" address="0x00009888" value="0x0BC000A5" />
+        <register type="NOA" address="0x00009888" value="0x11C00000" />
+        <register type="NOA" address="0x00009888" value="0x05C00000" />
+        <register type="NOA" address="0x00009888" value="0x0BC54000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x43900463" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900040" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x10800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x0007C000" />
+        <register type="OA" address="0x00002774" value="0x000007FF" />
+    </register_config>
+  </set>
+
+  <set name="MDAPI testing set Gen9"
+       mdapi_supported_apis="OGL OCL IO BB"
+       underscore_name="test_oa"
+       hw_config_guid="882fa433-1f4a-4a67-a962-c741888fe5f5"
+       chipset="SKLGT4"
+       symbol_name="TestOa"
+       >
+    <counter name="TestCounter7"
+             description="HW test counter 7. Factor: 0.666"
+             data_type="uint64"
+             equation="B 7 READ"
+             underscore_name="counter7"
+             units="events"
+             symbol_name="Counter7"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="TestCounter8"
+             description="HW test counter 8. Should be equal to 1."
+             data_type="uint64"
+             equation="C 7 READ"
+             underscore_name="counter8"
+             units="events"
+             symbol_name="Counter8"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter4"
+             description="HW test counter 4. Factor: 0.333"
+             data_type="uint64"
+             equation="B 4 READ"
+             underscore_name="counter4"
+             units="events"
+             symbol_name="Counter4"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter5"
+             description="HW test counter 5. Factor: 0.333"
+             data_type="uint64"
+             equation="B 5 READ"
+             underscore_name="counter5"
+             units="events"
+             symbol_name="Counter5"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter6"
+             description="HW test counter 6. Factor: 0.166"
+             data_type="uint64"
+             equation="B 6 READ"
+             underscore_name="counter6"
+             units="events"
+             symbol_name="Counter6"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter3"
+             description="HW test counter 3. Factor: 0.5"
+             data_type="uint64"
+             equation="B 3 READ"
+             underscore_name="counter3"
+             units="events"
+             symbol_name="Counter3"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter0"
+             description="HW test counter 0. Factor: 0.0"
+             data_type="uint64"
+             equation="B 0 READ"
+             underscore_name="counter0"
+             units="events"
+             symbol_name="Counter0"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter1"
+             description="HW test counter 1. Factor: 1.0"
+             data_type="uint64"
+             equation="B 1 READ"
+             underscore_name="counter1"
+             units="events"
+             symbol_name="Counter1"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="TestCounter2"
+             description="HW test counter 2. Factor: 1.0"
+             data_type="uint64"
+             equation="B 2 READ"
+             underscore_name="counter2"
+             units="events"
+             symbol_name="Counter2"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x11810000" />
+        <register type="NOA" address="0x00009888" value="0x07810013" />
+        <register type="NOA" address="0x00009888" value="0x1F810000" />
+        <register type="NOA" address="0x00009888" value="0x1D810000" />
+        <register type="NOA" address="0x00009888" value="0x1B930040" />
+        <register type="NOA" address="0x00009888" value="0x07E54000" />
+        <register type="NOA" address="0x00009888" value="0x1F908000" />
+        <register type="NOA" address="0x00009888" value="0x11900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x53900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002744" value="0x00800000" />
+        <register type="OA" address="0x00002714" value="0xF0800000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0xF0800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002770" value="0x00000004" />
+        <register type="OA" address="0x00002774" value="0x00000000" />
+        <register type="OA" address="0x00002778" value="0x00000003" />
+        <register type="OA" address="0x0000277C" value="0x00000000" />
+        <register type="OA" address="0x00002780" value="0x00000007" />
+        <register type="OA" address="0x00002784" value="0x00000000" />
+        <register type="OA" address="0x00002788" value="0x00100002" />
+        <register type="OA" address="0x0000278C" value="0x0000FFF7" />
+        <register type="OA" address="0x00002790" value="0x00100002" />
+        <register type="OA" address="0x00002794" value="0x0000FFCF" />
+        <register type="OA" address="0x00002798" value="0x00100082" />
+        <register type="OA" address="0x0000279C" value="0x0000FFEF" />
+        <register type="OA" address="0x000027A0" value="0x001000C2" />
+        <register type="OA" address="0x000027A4" value="0x0000FFE7" />
+        <register type="OA" address="0x000027A8" value="0x00100001" />
+        <register type="OA" address="0x000027AC" value="0x0000FFE7" />
+    </register_config>
+  </set>
+
+  <set name="Metric set PMA Stall"
+       mdapi_supported_apis="OGL OGL4 OCL IO MEDIA"
+       underscore_name="pma__stall"
+       hw_config_guid="befe9fd6-474e-4a3d-b98e-cd793715cf91"
+       chipset="SKLGT4"
+       symbol_name="PMA_Stall"
+       >
+    <counter name="GPU Time Elapsed"
+             description="Time elapsed on the GPU during the measurement."
+             data_type="uint64"
+             equation="GPU_TIME 0 READ 1000000000 UMUL $GpuTimestampFrequency UDIV"
+             underscore_name="gpu_time"
+             units="ns"
+             symbol_name="GpuTime"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="GPU Core Clocks"
+             description="The total number of GPU core clocks elapsed during the measurement."
+             data_type="uint64"
+             equation="GPU_CLOCK 0 READ"
+             underscore_name="gpu_core_clocks"
+             units="cycles"
+             symbol_name="GpuCoreClocks"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Frame Batch Draw"
+             mdapi_hw_unit_type="gpu"
+             mdapi_group="GPU"
+             />
+    <counter name="STC PMA stall"
+             description="Percentage of time when stencil cache line and an overlapping pixel are causing stalls"
+             data_type="float"
+             max_equation="100"
+             equation="B 0 READ B 1 READ FADD 2 FDIV 100 UMUL $GpuCoreClocks FDIV"
+             underscore_name="stc_pma_stall"
+             units="percent"
+             symbol_name="StcPMAStall"
+             availability="$SliceMask 1 AND"
+             semantic_type="duration"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Frame Batch Draw"
+             mdapi_group="GPU/Stencil Cache"
+             mdapi_hw_unit_type="gpu"
+             />
+    <counter name="AVG GPU Core Frequency"
+             description="Average GPU Core Frequency in the measurement."
+             data_type="uint64"
+             max_equation="$GpuMaxFrequency"
+             equation="$GpuCoreClocks 1000000000 UMUL $GpuTime UDIV"
+             underscore_name="avg_gpu_core_frequency"
+             units="hz"
+             symbol_name="AvgGpuCoreFrequency"
+             semantic_type="event"
+             mdapi_supported_apis=""
+             mdapi_usage_flags="Tier1 Overview System Frame Batch Draw"
+             mdapi_group="GPU"
+             mdapi_hw_unit_type="gpu"
+             />
+    <register_config type="NOA">
+        <register type="NOA" address="0x00009840" value="0x00000080" />
+        <register type="NOA" address="0x00009888" value="0x122D3080" />
+        <register type="NOA" address="0x00009888" value="0x000D2000" />
+        <register type="NOA" address="0x00009888" value="0x060D8000" />
+        <register type="NOA" address="0x00009888" value="0x080DA000" />
+        <register type="NOA" address="0x00009888" value="0x0A0DA000" />
+        <register type="NOA" address="0x00009888" value="0x0C0F0800" />
+        <register type="NOA" address="0x00009888" value="0x0E0FAA00" />
+        <register type="NOA" address="0x00009888" value="0x100F0002" />
+        <register type="NOA" address="0x00009888" value="0x002D0025" />
+        <register type="NOA" address="0x00009888" value="0x062D1300" />
+        <register type="NOA" address="0x00009888" value="0x082D16A4" />
+        <register type="NOA" address="0x00009888" value="0x0A2D162E" />
+        <register type="NOA" address="0x00009888" value="0x102D0000" />
+        <register type="NOA" address="0x00009888" value="0x1190003F" />
+        <register type="NOA" address="0x00009888" value="0x51900000" />
+        <register type="NOA" address="0x00009888" value="0x41900000" />
+        <register type="NOA" address="0x00009888" value="0x55900000" />
+        <register type="NOA" address="0x00009888" value="0x45900000" />
+        <register type="NOA" address="0x00009888" value="0x47900000" />
+        <register type="NOA" address="0x00009888" value="0x57900000" />
+        <register type="NOA" address="0x00009888" value="0x49900000" />
+        <register type="NOA" address="0x00009888" value="0x37900000" />
+        <register type="NOA" address="0x00009888" value="0x33900000" />
+    </register_config>
+    <register_config type="OA">
+        <register type="OA" address="0x00002740" value="0x00000000" />
+        <register type="OA" address="0x00002710" value="0x00000000" />
+        <register type="OA" address="0x00002714" value="0x30800000" />
+        <register type="OA" address="0x00002720" value="0x00000000" />
+        <register type="OA" address="0x00002724" value="0x00800000" />
+        <register type="OA" address="0x00002770" value="0x00E00021" />
+        <register type="OA" address="0x00002774" value="0x0007FFF8" />
+        <register type="OA" address="0x00002778" value="0x07000101" />
+        <register type="OA" address="0x0000277C" value="0x0038FFC7" />
+    </register_config>
+  </set>
+
+</metrics>
diff --git a/lib/i915/perf-configs/perf-codegen.py b/lib/i915/perf-configs/perf-codegen.py
new file mode 100755
index 00000000..69502f9b
--- /dev/null
+++ b/lib/i915/perf-configs/perf-codegen.py
@@ -0,0 +1,854 @@
+#!/usr/bin/env python2
+#
+# Copyright (c) 2015-2018 Intel Corporation
+#
+# Permission is hereby granted, free of charge, to any person obtaining a
+# copy of this software and associated documentation files (the "Software"),
+# to deal in the Software without restriction, including without limitation
+# the rights to use, copy, modify, merge, publish, distribute, sublicense,
+# and/or sell copies of the Software, and to permit persons to whom the
+# Software is furnished to do so, subject to the following conditions:
+#
+# The above copyright notice and this permission notice (including the next
+# paragraph) shall be included in all copies or substantial portions of the
+# Software.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+# THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+# FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
+# IN THE SOFTWARE.
+
+import argparse
+import os
+import sys
+import textwrap
+
+import xml.etree.cElementTree as et
+
+sys.dont_write_bytecode = True
+import codegen
+
+h = None
+c = None
+
+hashed_funcs = {}
+xml_equations = None
+
+def check_operand_type(set, arg):
+    if arg.isdigit():
+        return "\n<mn>" + arg + "</mn>"
+    elif arg[0] == "$":
+        if arg in set.counter_vars:
+            description = set.counter_vars[arg].get('description')
+        elif arg in hw_vars and 'desc' in hw_vars[arg]:
+            description = hw_vars[arg]['desc'];
+        else:
+            description = None
+
+        if description != None:
+            return "\n<maction actiontype='tooltip'>\n<mi>" + arg + "</mi>\n<mtext>" + description + "</mtext>\n</maction>"
+        else:
+            return "<mi>" + arg + "</mi>"
+    return arg
+
+# http://en.cppreference.com/w/c/language/operator_precedence
+and_precedence = 8
+shft_precedence = 5
+mul_precedence = 3
+add_precedence = 2
+sub_precedence = 2
+default_precedence = 16 #a high value which denotes no brackets needed
+
+def put_brackets(arg):
+    return "\n<mtext>(</mtext>" + arg + "\n<mtext>)</mtext>"
+
+def mathml_splice_add(set, args):
+    operand_0 = check_operand_type(set, args[0][0])
+    operand_1 = check_operand_type(set, args[1][0])
+    if args[0][1] < add_precedence:
+        operand_0 = put_brackets(args[0][0])
+    if args[1][1] < add_precedence:
+        operand_1 = put_brackets(args[1][0])
+    return [operand_1 + "\n<mo>+</mo>" + operand_0, add_precedence]
+
+def mathml_splice_div(set, args):
+    operand_0 = check_operand_type(set, args[0][0])
+    operand_1 = check_operand_type(set, args[1][0])
+    return ["\n<mfrac>\n<mrow>" + operand_1 + "\n</mrow>\n<mrow>" + operand_0 + "</mrow>\n</mfrac>", default_precedence]
+
+def mathml_splice_max(set, args):
+    operand_0 = check_operand_type(set, args[0][0])
+    operand_1 = check_operand_type(set, args[1][0])
+    return ["\n<mtext>max ( </mtext>" + operand_1 + "\n<mtext> , </mtext>" + operand_0 + "\n<mtext> ) </mtext>", default_precedence]
+
+def mathml_splice_mul(set, args):
+    operand_0 = check_operand_type(set, args[0][0])
+    operand_1 = check_operand_type(set, args[1][0])
+    if args[0][1] < mul_precedence:
+        operand_0 = put_brackets(args[0][0])
+    if args[1][1] < mul_precedence:
+        operand_1 = put_brackets(args[1][0])
+    return [operand_1 + "\n<mo>*</mo>" + operand_0, mul_precedence]
+
+def mathml_splice_sub(set, args):
+    operand_0 = check_operand_type(set, args[0][0])
+    operand_1 = check_operand_type(set, args[1][0])
+    if args[0][1] < sub_precedence:
+        operand_0 = put_brackets(args[0][0])
+    if args[1][1] < sub_precedence:
+        operand_1 = put_brackets(args[1][0])
+    return [operand_1 + "\n<mo>-</mo>" + operand_0, sub_precedence]
+
+def mathml_splice_read(set, args):
+    return ["\n<maction actiontype='tooltip'>\n<mi>" + args[1][0] + args[0][0] + "</mi>\n<mtext>placeholder</mtext>\n</maction>", default_precedence]
+
+def mathml_splice_read_reg(set, args):
+    return ["\n<maction actiontype='tooltip'>\n<mi>" + args[0][0] + "</mi>\n<mtext>placeholder</mtext>\n</maction>", default_precedence]
+
+def mathml_splice_min(set, args):
+    operand_0 = check_operand_type(set, args[0][0])
+    operand_1 = check_operand_type(set, args[1][0])
+    return ["\n<mtext>min ( </mtext>" + operand_1 + "\n<mtext> , </mtext>" + operand_0 + "\n<mtext> ) </mtext>", default_precedence]
+
+def mathml_splice_lshft(set, args):
+    operand_0 = check_operand_type(set, args[0][0])
+    operand_1 = check_operand_type(set, args[1][0])
+    if args[0][1] < shft_precedence:
+        operand_0 = put_brackets(args[0][0])
+    if args[1][1] < shft_precedence:
+        operand_1 = put_brackets(args[1][0])
+    return [operand_1 + "\n<mo><<</mo>" + operand_0, shft_precedence]
+
+def mathml_splice_rshft(set, args):
+    operand_0 = check_operand_type(set, args[0][0])
+    operand_1 = check_operand_type(set, args[1][0])
+    if args[0][1] < mul_precedence:
+        operand_0 = put_brackets(args[0][0])
+    if args[1][1] < mul_precedence:
+        operand_1 = put_brackets(args[1][0])
+    return [operand_1 + "\n<mo>>></mo>" + operand_0, mul_precedence]
+
+def mathml_splice_and(set, args):
+    operand_0 = check_operand_type(set, args[0][0])
+    operand_1 = check_operand_type(set, args[1][0])
+    if args[0][1] < and_precedence:
+        operand_0 = put_brackets(args[0][0])
+    if args[1][1] < and_precedence:
+        operand_1 = put_brackets(args[1][0])
+    return [operand_1 + "\n<mo>&</mo>" + operand_0, and_precedence]
+
+def emit_fadd(tmp_id, args):
+    c("double tmp{0} = {1} + {2};".format(tmp_id, args[1], args[0]))
+    return tmp_id + 1
+
+# Be careful to check for divide by zero...
+def emit_fdiv(tmp_id, args):
+    c("double tmp{0} = {1};".format(tmp_id, args[1]))
+    c("double tmp{0} = {1};".format(tmp_id + 1, args[0]))
+    c("double tmp{0} = tmp{1} ? tmp{2} / tmp{1} : 0;".format(tmp_id + 2, tmp_id + 1, tmp_id))
+    return tmp_id + 3
+
+def emit_fmax(tmp_id, args):
+    c("double tmp{0} = {1};".format(tmp_id, args[1]))
+    c("double tmp{0} = {1};".format(tmp_id + 1, args[0]))
+    c("double tmp{0} = MAX(tmp{1}, tmp{2});".format(tmp_id + 2, tmp_id, tmp_id + 1))
+    return tmp_id + 3
+
+def emit_fmul(tmp_id, args):
+    c("double tmp{0} = {1} * {2};".format(tmp_id, args[1], args[0]))
+    return tmp_id + 1
+
+def emit_fsub(tmp_id, args):
+    c("double tmp{0} = {1} - {2};".format(tmp_id, args[1], args[0]))
+    return tmp_id + 1
+
+def emit_read(tmp_id, args):
+    type = args[1].lower()
+    c("uint64_t tmp{0} = accumulator[metric_set->{1}_offset + {2}];".format(tmp_id, type, args[0]))
+    return tmp_id + 1
+
+def emit_read_reg(tmp_id, args):
+    c("uint64_t tmp{0} = 0;".format(tmp_id))
+    return tmp_id + 1
+
+def emit_uadd(tmp_id, args):
+    c("uint64_t tmp{0} = {1} + {2};".format(tmp_id, args[1], args[0]))
+    return tmp_id + 1
+
+# Be careful to check for divide by zero...
+def emit_udiv(tmp_id, args):
+    c("uint64_t tmp{0} = {1};".format(tmp_id, args[1]))
+    c("uint64_t tmp{0} = {1};".format(tmp_id + 1, args[0]))
+    c("uint64_t tmp{0} = tmp{1} ? tmp{2} / tmp{1} : 0;".format(tmp_id + 2, tmp_id + 1, tmp_id))
+    return tmp_id + 3
+
+def emit_umul(tmp_id, args):
+    c("uint64_t tmp{0} = {1} * {2};".format(tmp_id, args[1], args[0]))
+    return tmp_id + 1
+
+def emit_usub(tmp_id, args):
+    c("uint64_t tmp{0} = {1} - {2};".format(tmp_id, args[1], args[0]))
+    return tmp_id + 1
+
+def emit_umin(tmp_id, args):
+    c("uint64_t tmp{0} = MIN({1}, {2});".format(tmp_id, args[1], args[0]))
+    return tmp_id + 1
+
+def emit_lshft(tmp_id, args):
+    c("uint64_t tmp{0} = {1} << {2};".format(tmp_id, args[1], args[0]))
+    return tmp_id + 1
+
+def emit_rshft(tmp_id, args):
+    c("uint64_t tmp{0} = {1} >> {2};".format(tmp_id, args[1], args[0]))
+    return tmp_id + 1
+
+def emit_and(tmp_id, args):
+    c("uint64_t tmp{0} = {1} & {2};".format(tmp_id, args[1], args[0]))
+    return tmp_id + 1
+
+ops = {}
+#                     (n operands, emitter1, emitter2)
+ops["FADD"]     = (2, emit_fadd, mathml_splice_add)
+ops["FDIV"]     = (2, emit_fdiv, mathml_splice_div)
+ops["FMAX"]     = (2, emit_fmax, mathml_splice_max)
+ops["FMUL"]     = (2, emit_fmul, mathml_splice_mul)
+ops["FSUB"]     = (2, emit_fsub, mathml_splice_sub)
+ops["READ"]     = (2, emit_read, mathml_splice_read)
+ops["READ_REG"] = (1, emit_read_reg, mathml_splice_read_reg)
+ops["UADD"]     = (2, emit_uadd, mathml_splice_add)
+ops["UDIV"]     = (2, emit_udiv, mathml_splice_div)
+ops["UMUL"]     = (2, emit_umul, mathml_splice_mul)
+ops["USUB"]     = (2, emit_usub, mathml_splice_sub)
+ops["UMIN"]     = (2, emit_umin, mathml_splice_min)
+ops["<<"]       = (2, emit_lshft, mathml_splice_lshft)
+ops[">>"]       = (2, emit_rshft, mathml_splice_rshft)
+ops["AND"]      = (2, emit_and, mathml_splice_and)
+
+def brkt(subexp):
+    if " " in subexp:
+        return "(" + subexp + ")"
+    else:
+        return subexp
+
+def splice_bitwise_and(args):
+    return brkt(args[1]) + " & " + brkt(args[0])
+
+def splice_logical_and(args):
+    return brkt(args[1]) + " && " + brkt(args[0])
+
+def splice_ult(args):
+    return brkt(args[1]) + " < " + brkt(args[0])
+
+def splice_ugte(args):
+    return brkt(args[1]) + " >= " + brkt(args[0])
+
+exp_ops = {}
+#                 (n operands, splicer)
+exp_ops["AND"]  = (2, splice_bitwise_and)
+exp_ops["UGTE"] = (2, splice_ugte)
+exp_ops["ULT"]  = (2, splice_ult)
+exp_ops["&&"]   = (2, splice_logical_and)
+
+
+hw_vars = {
+        "$EuCoresTotalCount": { 'c': "devinfo->n_eus", 'desc': "The total number of execution units" },
+        "$EuSlicesTotalCount": { 'c': "devinfo->n_eu_slices" },
+        "$EuSubslicesTotalCount": { 'c': "devinfo->n_eu_sub_slices" },
+        "$EuThreadsCount": { 'c': "devinfo->eu_threads_count" },
+        "$SliceMask": { 'c': "devinfo->slice_mask" },
+        "$SubsliceMask": { 'c': "devinfo->subslice_mask" },
+        "$GpuTimestampFrequency": { 'c': "devinfo->timestamp_frequency" },
+        "$GpuMinFrequency": { 'c': "devinfo->gt_min_freq" },
+        "$GpuMaxFrequency": { 'c': "devinfo->gt_max_freq" },
+        "$SkuRevisionId": { 'c': "devinfo->revision" },
+        "$QueryMode": { 'c': "devinfo->query_mode" },
+}
+
+def splice_mathml_expression(set, equation, tag):
+    tokens = equation.split()
+    mathml_stack = []
+    tmp_xml_operand = ""
+    for token in tokens:
+        if not mathml_stack:
+            token = check_operand_type(set, token)
+        mathml_stack.append([token, default_precedence])
+        while mathml_stack and mathml_stack[-1][0] in ops:
+            op = mathml_stack.pop()[0]
+            argc, callback, mathml_callback = ops[op]
+            xml_args = []
+            for i in range(0, argc):
+                xml_operand = mathml_stack.pop()
+                xml_args.append(xml_operand)
+            tmp_xml_operand = mathml_callback(set, xml_args)
+            mathml_stack.append(tmp_xml_operand)
+    xml_string = mathml_stack.pop()[0]
+    equation_descr = "<mi>" + tag + "</mi><mo> = </mo>"
+    return "<mathml_" + tag + ">" + equation_descr + xml_string + "</mathml_" + tag + ">"
+
+def output_rpn_equation_code(set, counter, equation):
+    c("/* RPN equation: " + equation + " */")
+    tokens = equation.split()
+    stack = []
+    tmp_id = 0
+    tmp = None
+
+    for token in tokens:
+        stack.append(token)
+        while stack and stack[-1] in ops:
+            op = stack.pop()
+            argc, callback, mathml_callback = ops[op]
+            args = []
+            for i in range(0, argc):
+                operand = stack.pop()
+                if operand[0] == "$":
+                    if operand in hw_vars:
+                        operand = hw_vars[operand]['c']
+                    elif operand in set.counter_vars:
+                        reference = set.counter_vars[operand]
+                        operand = set.read_funcs[operand[1:]] + "(devinfo, metric_set, accumulator)"
+                    else:
+                        raise Exception("Failed to resolve variable " + operand + " in equation " + equation + " for " + set.name + " :: " + counter.get('name'));
+                args.append(operand)
+
+            tmp_id = callback(tmp_id, args)
+
+            tmp = "tmp{0}".format(tmp_id - 1)
+            stack.append(tmp)
+
+    if len(stack) != 1:
+        raise Exception("Spurious empty rpn code for " + set.name + " :: " +
+                counter.get('name') + ".\nThis is probably due to some unhandled RPN function, in the equation \"" +
+                equation + "\"")
+
+    value = stack[-1]
+
+    if value in hw_vars:
+        value = hw_vars[value]['c']
+    if value in set.counter_vars:
+        value = set.read_funcs[value[1:]] + "(devinfo, metric_set, accumulator)"
+
+    c("\nreturn " + value + ";")
+
+def splice_rpn_expression(set, counter_name, expression):
+    tokens = expression.split()
+    stack = []
+
+    for token in tokens:
+        stack.append(token)
+        while stack and stack[-1] in exp_ops:
+            op = stack.pop()
+            argc, callback = exp_ops[op]
+            args = []
+            for i in range(0, argc):
+                operand = stack.pop()
+                if operand[0] == "$":
+                    if operand in hw_vars:
+                        operand = hw_vars[operand]['c']
+                    else:
+                        raise Exception("Failed to resolve variable " + operand + " in expression " + expression + " for " + set.name + " :: " + counter_name)
+                args.append(operand)
+
+            subexp = callback(args)
+
+            stack.append(subexp)
+
+    if len(stack) != 1:
+        raise Exception("Spurious empty rpn expression for " + set.name + " :: " +
+                counter_name + ".\nThis is probably due to some unhandled RPN operation, in the expression \"" +
+                expression + "\"")
+
+    return stack[-1]
+
+
+def data_type_to_ctype(ret_type):
+    if ret_type == "uint64":
+        return "uint64_t"
+    elif ret_type == "float":
+        return "double"
+    else:
+        raise Exception("Unhandled case for mapping \"" + ret_type + "\" to a C type")
+
+
+def output_counter_read(gen, set, counter):
+    c("\n")
+    c("/* {0} :: {1} */".format(set.name, counter.get('name')))
+
+    if counter.read_hash in hashed_funcs:
+        c("#define %s \\" % counter.read_sym)
+        c.indent(4)
+        c("%s" % hashed_funcs[counter.read_hash])
+        c.outdent(4)
+    else:
+        ret_type = counter.get('data_type')
+        ret_ctype = data_type_to_ctype(ret_type)
+        read_eq = counter.get('equation')
+
+        c("static " + ret_ctype)
+        c(counter.read_sym + "(const struct intel_perf_devinfo *devinfo,\n")
+        c.indent(len(counter.read_sym) + 1)
+        c("const struct intel_perf_metric_set *metric_set,\n")
+        c("uint64_t *accumulator)\n")
+        c.outdent(len(counter.read_sym) + 1)
+
+        c("{")
+        c.indent(4)
+
+        output_rpn_equation_code(set, counter, read_eq)
+
+        c.outdent(4)
+        c("}")
+
+        hashed_funcs[counter.read_hash] = counter.read_sym
+
+
+def output_counter_max(gen, set, counter):
+    max_eq = counter.get('max_equation')
+
+    if not max_eq or max_eq == "100":
+        return
+
+    c("\n")
+    c("/* {0} :: {1} */".format(set.name, counter.get('name')))
+
+    if counter.max_hash in hashed_funcs:
+        c("#define %s \\" % counter.max_sym)
+        c.indent(4)
+        c("%s" % hashed_funcs[counter.max_hash])
+        c.outdent(4)
+    else:
+        ret_type = counter.get('data_type')
+        ret_ctype = data_type_to_ctype(ret_type)
+
+        c("static " + ret_ctype)
+
+        c(counter.max_sym + "(const struct intel_perf_devinfo *devinfo,\n")
+        c.indent(len(counter.max_sym) + 1)
+        c("const struct intel_perf_metric_set *metric_set,\n")
+        c("uint64_t *accumulator)\n")
+        c.outdent(len(counter.max_sym) + 1)
+
+        c("{")
+        c.indent(4)
+
+        output_rpn_equation_code(set, counter, max_eq)
+
+        c.outdent(4)
+        c("}")
+
+        hashed_funcs[counter.max_hash] = counter.max_sym
+
+
+semantic_type_map = {
+    "duration": "raw",
+    "ratio": "event"
+    }
+
+def output_availability(set, availability, counter_name):
+    expression = splice_rpn_expression(set, counter_name, availability)
+    lines = expression.split(' && ')
+    n_lines = len(lines)
+    if n_lines == 1:
+        c("if (" + lines[0] + ") {")
+    else:
+        c("if (" + lines[0] + " &&")
+        c.indent(4)
+        for i in range(1, (n_lines - 1)):
+            c(lines[i] + " &&")
+        c(lines[(n_lines - 1)] + ") {")
+        c.outdent(4)
+
+
+def output_units(unit):
+    return unit.replace(' ', '_').upper()
+
+
+def output_counter_report(set, counter):
+    data_type = counter.get('data_type')
+    data_type_uc = data_type.upper()
+    c_type = data_type
+
+    if "uint" in c_type:
+        c_type = c_type + "_t"
+
+    semantic_type = counter.get('semantic_type')
+    if semantic_type in semantic_type_map:
+        semantic_type = semantic_type_map[semantic_type]
+
+    semantic_type_uc = semantic_type.upper()
+
+    c("\n")
+
+    availability = counter.get('availability')
+    if availability:
+        output_availability(set, availability, counter.get('name'))
+        c.indent(4)
+
+    c("counter = &metric_set->counters[metric_set->n_counters++];\n")
+    c("counter->metric_set = metric_set;\n")
+    c("counter->name = \"{0}\";\n".format(counter.get('name')))
+    c("counter->symbol_name = \"{0}\";\n".format(counter.get('symbol_name')));
+    c("counter->desc = \"{0}\";\n".format(counter.get('description')))
+    c("counter->type = INTEL_PERF_LOGICAL_COUNTER_TYPE_{0};\n".format(semantic_type_uc))
+    c("counter->storage = INTEL_PERF_LOGICAL_COUNTER_STORAGE_{0};\n".format(data_type_uc))
+    c("counter->unit = INTEL_PERF_LOGICAL_COUNTER_UNIT_{0};\n".format(output_units(counter.get('units'))))
+    c("counter->read_{0} = {1};\n".format(data_type, set.read_funcs[counter.get('symbol_name')]))
+    c("counter->max_{0} = {1};\n".format(data_type, set.max_funcs[counter.get('symbol_name')]))
+    c("intel_perf_add_logical_counter(perf, counter, \"{0}\");\n".format(counter.get('mdapi_group')))
+
+    if availability:
+        c.outdent(4)
+        c("}\n")
+
+
+def generate_register_configs(set):
+    register_types = {
+        'FLEX': 'flex_regs',
+        'NOA': 'mux_regs',
+        'OA': 'b_counter_regs',
+    }
+
+    # allocate memory
+    total_n_registers = {}
+    register_configs = set.findall('register_config')
+    for register_config in register_configs:
+        t = register_types[register_config.get('type')]
+        if t not in total_n_registers:
+            total_n_registers[t] = len(register_config.findall('register'))
+        else:
+            total_n_registers[t] += len(register_config.findall('register'))
+
+    for reg in total_n_registers:
+        c("metric_set->{0} = calloc({1}, sizeof(struct intel_perf_register_prog));".format(reg, total_n_registers[reg]))
+    c("\n")
+
+    # fill in register/values
+    register_configs = set.findall('register_config')
+    for register_config in register_configs:
+        t = register_types[register_config.get('type')]
+
+        availability = register_config.get('availability')
+        if availability:
+            output_availability(set, availability, register_config.get('type') + ' register config')
+            c.indent(4)
+
+        for register in register_config.findall('register'):
+            c("metric_set->%s[metric_set->n_%s++] = (struct intel_perf_register_prog) { .reg = %s, .val = %s };" %
+              (t, t, register.get('address'), register.get('value')))
+
+        if availability:
+            c.outdent(4)
+            c("}")
+        c("\n")
+
+#
+
+class Counter:
+    def __init__(self, set, xml):
+        self.xml = xml
+        self.set = set
+        self.read_hash = None
+        self.max_hash = None
+
+        self.read_sym = "{0}__{1}__{2}__read".format(self.set.gen.chipset,
+                                                     self.set.underscore_name,
+                                                     self.xml.get('underscore_name'))
+
+        max_eq = self.xml.get('max_equation')
+        if not max_eq:
+            self.max_sym = "NULL /* undefined */"
+        elif max_eq == "100":
+            self.max_sym = "percentage_max_callback_" + self.xml.get('data_type')
+        else:
+            self.max_sym = "{0}__{1}__{2}__max".format(self.set.gen.chipset,
+                                                       self.set.underscore_name,
+                                                       self.xml.get('underscore_name'))
+
+    def get(self, prop):
+        return self.xml.get(prop)
+
+    def compute_hashes(self):
+        if self.read_hash is not None:
+            return
+
+        def replace_func(token):
+            if token[0] != "$":
+                return token
+            if token not in self.set.counter_vars:
+                return token
+            self.set.counter_vars[token].compute_hashes()
+            return self.set.counter_vars[token].read_hash
+
+        read_eq = self.xml.get('equation')
+        self.read_hash = ' '.join(map(replace_func, read_eq.split()))
+
+        max_eq = self.xml.get('max_equation')
+        if max_eq:
+            self.max_hash = ' '.join(map(replace_func, max_eq.split()))
+
+
+class Set:
+    def __init__(self, gen, xml):
+        self.gen = gen
+        self.xml = xml
+
+        self.counter_vars = {}
+        self.max_funcs = {}
+        self.read_funcs = {}
+        self.counter_hashes = {}
+
+        self.counters = []
+        xml_counters = self.xml.findall("counter")
+        for xml_counter in xml_counters:
+            counter = Counter(self, xml_counter)
+            self.counters.append(counter)
+            self.counter_vars["$" + counter.get('symbol_name')] = counter
+            self.max_funcs[counter.get('symbol_name')] = counter.max_sym
+            self.read_funcs[counter.get('symbol_name')] = counter.read_sym
+
+        for counter in self.counters:
+            counter.compute_hashes()
+
+    @property
+    def hw_config_guid(self):
+        return self.xml.get('hw_config_guid')
+
+    @property
+    def name(self):
+        return self.xml.get('name')
+
+    @property
+    def symbol_name(self):
+        return self.xml.get('symbol_name')
+
+    @property
+    def underscore_name(self):
+        return self.xml.get('underscore_name')
+
+    def findall(self, path):
+        return self.xml.findall(path)
+
+    def find(self, path):
+        return self.xml.find(path)
+
+
+class Gen:
+    def __init__(self, filename):
+        self.filename = filename
+        self.xml = et.parse(self.filename)
+        self.chipset = self.xml.find('.//set').get('chipset').lower()
+        self.sets = []
+
+        for xml_set in self.xml.findall(".//set"):
+            self.sets.append(Set(self, xml_set))
+
+
+def main():
+    global c
+    global h
+    global xml_equations
+
+    parser = argparse.ArgumentParser()
+    parser.add_argument("--header", help="Header file to write")
+    parser.add_argument("--code", help="C file to write")
+    parser.add_argument("--xml-out", help="Output XML files (adding mathml equations)")
+    parser.add_argument("xml_files", nargs='+', help="List of xml metrics files to process")
+
+    args = parser.parse_args()
+
+    # Note: either arg may == None
+    h = codegen.Codegen(args.header)
+    c = codegen.Codegen(args.code)
+
+    gens = []
+    for xml_file in args.xml_files:
+        gens.append(Gen(xml_file))
+
+    if args.xml_out:
+        for gen in gens:
+            for set in gen.sets:
+                for counter in set.counters:
+                    xml_equation = splice_mathml_expression(set, counter.get('equation'), "EQ")
+                    counter.append(et.fromstring(xml_equation))
+            gen.xml.write(gen.filename)
+
+
+    copyright = textwrap.dedent("""\
+        /* Autogenerated file, DO NOT EDIT manually! generated by {}
+         *
+         * Copyright (c) 2018 Intel Corporation
+         *
+         * Permission is hereby granted, free of charge, to any person obtaining a
+         * copy of this software and associated documentation files (the "Software"),
+         * to deal in the Software without restriction, including without limitation
+         * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+         * and/or sell copies of the Software, and to permit persons to whom the
+         * Software is furnished to do so, subject to the following conditions:
+         *
+         * The above copyright notice and this permission notice (including the next
+         * paragraph) shall be included in all copies or substantial portions of the
+         * Software.
+         *
+         * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+         * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+         * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+         * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+         * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+         * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+         * DEALINGS IN THE SOFTWARE.
+         */
+
+        """).format(os.path.basename(__file__))
+
+    h(copyright)
+    c(copyright)
+    c(textwrap.dedent("""\
+        #include <stddef.h>
+        #include <stdint.h>
+        #include <stdbool.h>
+        #include <assert.h>
+
+        """))
+
+    c("#include \"" + os.path.basename(args.header) + "\"")
+
+    c(textwrap.dedent("""\
+        #include <stdlib.h>
+        #include <string.h>
+
+        #include "i915/perf.h"
+
+        #define MIN(x, y) (((x) < (y)) ? (x) : (y))
+        #define MAX(a, b) (((a) > (b)) ? (a) : (b))
+
+        static double
+        percentage_max_callback_float(const struct intel_perf_devinfo *devinfo,
+                                      const struct intel_perf_metric_set *metric_set,
+                                      uint64_t *accumulator)
+        {
+           return 100;
+        }
+
+        static uint64_t
+        percentage_max_callback_uint64(const struct intel_perf_devinfo *devinfo,
+                                       const struct intel_perf_metric_set *metric_set,
+                                       uint64_t *accumulator)
+        {
+           return 100;
+        }
+
+        """))
+
+    # Print out all equation functions.
+    for gen in gens:
+        for set in gen.sets:
+            for counter in set.counters:
+                output_counter_read(gen, set, counter)
+                output_counter_max(gen, set, counter)
+
+    # Print out all set registration functions for each set in each
+    # generation.
+    for gen in gens:
+        for set in gen.sets:
+            c("\nstatic void\n")
+            c(gen.chipset + "_add_" + set.underscore_name + "_metric_set(struct intel_perf *perf,")
+            c.indent(4)
+            c("const struct intel_perf_devinfo *devinfo)")
+            c.outdent(4)
+            c("{\n")
+            c.indent(4)
+
+            c("struct intel_perf_metric_set *metric_set;\n")
+            c("struct intel_perf_logical_counter *counter;\n\n")
+
+            counters = sorted(set.counters, key=lambda k: k.get('symbol_name'))
+
+            c("metric_set = calloc(1, sizeof(*metric_set));\n")
+            c("metric_set->name = \"" + set.name + "\";\n")
+            c("metric_set->symbol_name = \"" + set.symbol_name + "\";\n")
+            c("metric_set->hw_config_guid = \"" + set.hw_config_guid + "\";\n")
+            c("metric_set->counters = calloc({0}, sizeof(struct intel_perf_logical_counter));\n".format(str(len(counters))))
+            c("metric_set->n_counters = 0;\n")
+            c("metric_set->perf_oa_metrics_set = 0; // determined at runtime\n")
+
+            if gen.chipset == "hsw":
+                c(textwrap.dedent("""\
+                    metric_set->perf_oa_format = I915_OA_FORMAT_A45_B8_C8;
+
+                    metric_set->perf_raw_size = 256;
+                    metric_set->gpu_time_offset = 0;
+                    metric_set->a_offset = 1;
+                    metric_set->b_offset = metric_set->a_offset + 45;
+                    metric_set->c_offset = metric_set->b_offset + 8;
+
+                    """))
+            else:
+                c(textwrap.dedent("""\
+                    metric_set->perf_oa_format = I915_OA_FORMAT_A32u40_A4u32_B8_C8;
+
+                    metric_set->perf_raw_size = 256;
+                    metric_set->gpu_time_offset = 0;
+                    metric_set->gpu_clock_offset = 1;
+                    metric_set->a_offset = 2;
+                    metric_set->b_offset = metric_set->a_offset + 36;
+                    metric_set->c_offset = metric_set->b_offset + 8;
+
+                    """))
+
+            c("intel_perf_add_metric_set(perf, metric_set);");
+            c("\n")
+
+            generate_register_configs(set)
+
+            for counter in counters:
+                output_counter_report(set, counter)
+
+            c("\nassert(metric_set->n_counters <= {0});\n".format(len(counters)));
+
+            c.outdent(4)
+            c("}\n")
+
+    h(textwrap.dedent("""\
+        #pragma once
+
+        #include "i915/perf.h"
+
+        #ifdef __cplusplus
+        extern "C" {
+        #endif
+
+        """))
+
+    # Print out all set registration functions for each generation.
+    for gen in gens:
+        h("struct intel_perf *intel_perf_get_metrics_" + gen.chipset + "(const struct intel_perf_devinfo *devinfo);\n\n")
+
+        c("\nstruct intel_perf *")
+        c("intel_perf_get_metrics_" + gen.chipset + "(const struct intel_perf_devinfo *devinfo)")
+        c("{")
+        c.indent(4)
+
+        c("struct intel_perf *perf = intel_perf_new();\n")
+        c("\n")
+
+        for set in gen.sets:
+            c("{0}_add_{1}_metric_set(perf, devinfo);".format(gen.chipset, set.underscore_name))
+
+        c("\n")
+        c("return perf;")
+
+        c.outdent(4)
+        c("}")
+
+    h(textwrap.dedent("""\
+        #ifdef __cplusplus
+        } /* extern C */
+        #endif
+
+        """))
+
+
+if __name__ == '__main__':
+    main()
diff --git a/lib/i915/perf-configs/update-guids.py b/lib/i915/perf-configs/update-guids.py
new file mode 100755
index 00000000..51e73f1b
--- /dev/null
+++ b/lib/i915/perf-configs/update-guids.py
@@ -0,0 +1,230 @@
+#!/usr/bin/env python2
+# coding=utf-8
+
+# Copyright (C) 2016 Intel Corporation
+#
+# Permission is hereby granted, free of charge, to any person obtaining a copy
+# of this software and associated documentation files (the "Software"), to deal
+# in the Software without restriction, including without limitation the rights
+# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+# copies of the Software, and to permit persons to whom the Software is
+# furnished to do so, subject to the following conditions:
+#
+# The above copyright notice and this permission notice shall be included in
+# all copies or substantial portions of the Software.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+# SOFTWARE.
+
+# This script can:
+#
+# - Automatically add template entries for unregistered metric sets diescovered
+#   in new mdapi xml files.
+# - Once mdapi-convert-xml.py has been run to output register configs for new
+#   metric sets then re-running this script can add the config_hash attribute
+#   to corresponding registry entries.
+#
+# The script is designed to allow incremental updates/fixups of the guid
+# registry by working in terms of:
+#
+# 1) load all the existing state
+# 2) apply tweaks/modifications
+# 3) write everything back out
+#
+# The script should gracefully handle incomplete guid entries, which is
+# important when considering how the mdapi-xml-convert.py script depends on the
+# 'mdapi_config_hash' attribute while adding the 'config_hash' attribute
+# depends on the configs output by mdapi-xml-convert.py.
+
+
+
+import argparse
+import os.path
+import re
+import sys
+import time
+import uuid
+
+import xml.etree.ElementTree as et
+import xml.sax.saxutils as saxutils
+
+import pylibs.oa_guid_registry as oa_registry
+
+
+def print_err(*args):
+    sys.stderr.write(' '.join(map(str,args)) + '\n')
+
+def guid_hashing_key(guid_obj):
+    return oa_registry.Registry.chipset_derive_hash(guid_obj['chipset'],
+                                                    guid_obj['mdapi_config_hash'])
+
+parser = argparse.ArgumentParser()
+parser.add_argument("xml", nargs="+", help="XML description of metrics")
+parser.add_argument("--guids", required=True, help="Metric set GUID registry")
+
+args = parser.parse_args()
+
+
+guids = []
+guid_index = {} # guid objects indexed by id
+mdapi_config_hash_guid_table = {} # indexed by MDAPI XML register config hash
+named_guid_table = {} # indexed by name=<chipset>_<symbol_name>
+
+
+
+# 1) read everything we have currently
+#
+guids_xml = et.parse(args.guids)
+for guid in guids_xml.findall(".//guid"):
+    guid_obj = {}
+
+    if guid.get('id') != None:
+        guid_obj['id'] = guid.get('id')
+    else:
+        guid_obj['id'] = str(uuid.uuid4())
+
+    if guid.get('mdapi_config_hash') != None:
+        guid_obj['mdapi_config_hash'] = guid.get('mdapi_config_hash')
+    if guid.get('config_hash') != None:
+        guid_obj['config_hash'] = guid.get('config_hash')
+
+    if guid.get('chipset') != None:
+        guid_obj['chipset'] = guid.get('chipset')
+    if guid.get('name') != None:
+        guid_obj['name'] = guid.get('name')
+        named_guid_table[guid_obj['chipset'] + "_" + guid_obj['name']] = guid_obj
+
+    if 'mdapi_config_hash' in guid_obj:
+        hashing_key = oa_registry.Registry.chipset_derive_hash(guid_obj['chipset'],
+                                                               guid_obj['mdapi_config_hash'])
+        mdapi_config_hash_guid_table[hashing_key] = guid_obj
+
+    guids.append(guid_obj)
+
+    if guid_obj['id'] in guid_index:
+        print_err("Duplicate GUID " + guid_obj['id'] + "!")
+        sys.exit(1)
+    guid_index[guid_obj['id']] = guid_obj
+
+
+#
+# 2) fixup/modify the guid entries...
+#
+
+
+for arg in args.xml:
+    internal = et.parse(arg)
+
+    concurrent_group = internal.find(".//ConcurrentGroup")
+
+    for mdapi_set in internal.findall(".//MetricSet"):
+
+        mdapi_config_hash = oa_registry.Registry.mdapi_hw_config_hash(mdapi_set)
+
+        chipset = mdapi_set.get('SupportedHW').lower()
+        if concurrent_group.get('SupportedGT') != None:
+            chipset = chipset + concurrent_group.get('SupportedGT').lower()
+
+        set_name = mdapi_set.get('SymbolName')
+
+        name = chipset + "_" + set_name;
+
+        hashing_key = oa_registry.Registry.chipset_derive_hash(chipset, mdapi_config_hash)
+        if hashing_key in mdapi_config_hash_guid_table:
+            guid_obj = mdapi_config_hash_guid_table[hashing_key]
+
+            guid_obj['name'] = set_name
+            guid_obj['chipset'] = chipset
+            guid_obj['matched_mdapi'] = True
+        elif name in named_guid_table:
+            guid_obj = named_guid_table[name]
+
+            guid_obj['matched_mdapi'] = True
+            guid_obj['mdapi_config_hash'] = mdapi_config_hash
+            if 'config_hash' in guid_obj:
+                del guid_obj['config_hash']
+            guid_obj['comment'] = "WARNING: MDAPI XML config hash changed! If upstream, double check raw counter semantics unchanged"
+            print_err("WARNING: MDAPI XML config hash changed for \"" + set_name + "\" (" + chipset + ") If upstream, double check raw counter semantics unchanged")
+        else:
+            guid_obj = { 'mdapi_config_hash': mdapi_config_hash,
+                         'id': str(uuid.uuid4()),
+                         'name': set_name,
+                         'chipset': chipset,
+                         'unregistered': True,
+                         'matched_mdapi': True,
+                         'comment': "New"
+                       }
+            guid_index[guid_obj['id']] = guid_obj
+            mdapi_config_hash_guid_table[guid_hashing_key(guid_obj)] = guid_obj
+            guids.append(guid_obj)
+            print_err("New GUID \"" + guid_obj['id'] + "\" for metric set = " + set_name + " (" + chipset + ")")
+
+        named_guid_table[chipset + '_' + set_name] = guid_obj
+
+
+
+chipsets = [ 'hsw',
+             'bdw', 'chv',
+             'sklgt2', 'sklgt3', 'sklgt4', 'kblgt2', 'kblgt3', 'cflgt2', 'cflgt3',
+             'bxt', 'glk',
+             'cnl',
+             'icl' ]
+
+for chipset in chipsets:
+    filename = 'oa-' + chipset + '.xml'
+    if not os.path.isfile(filename):
+        continue
+
+    public = et.parse(filename)
+
+    for metricset in public.findall(".//set"):
+
+        set_name = metricset.get('symbol_name')
+
+        config_hash = oa_registry.Registry.hw_config_hash(metricset)
+
+        guid_key = chipset + "_" + set_name
+        if guid_key in named_guid_table:
+            guid_obj = named_guid_table[guid_key]
+            guid_obj['config_hash'] = config_hash
+
+
+#
+# 3) write all the guids back out...
+
+print("<guids>")
+for guid_obj in guids:
+    comment = None
+    line = "<guid"
+
+    if 'matched_mdapi' not in guid_obj:
+        comment = "Not found in MDAPI XML file[s]; Entry copied unmodified (maybe removed from MDAPI XML or not all files given on command line)"
+
+    if 'comment' in guid_obj:
+        comment = guid_obj['comment']
+
+    if 'config_hash' in guid_obj:
+        line = line + ' config_hash="' + guid_obj['config_hash'] + '"'
+    if 'mdapi_config_hash' in guid_obj:
+        line = line + ' mdapi_config_hash="' + guid_obj['mdapi_config_hash'] + '"'
+
+    line = line + ' id="' + guid_obj['id'] + '"'
+
+    if 'chipset' in guid_obj:
+        line = line + ' chipset="' + guid_obj['chipset'] + '"'
+
+    if 'name' in guid_obj:
+        line = line + ' name="' + guid_obj['name'] + '"'
+
+    line = line + ' />'
+
+    if comment != None:
+        print("    <!-- ↓" + comment + " -->")
+
+    print("    " + line)
+print("</guids>")
diff --git a/lib/i915/perf.c b/lib/i915/perf.c
new file mode 100644
index 00000000..1627f102
--- /dev/null
+++ b/lib/i915/perf.c
@@ -0,0 +1,194 @@
+/*
+ * Copyright (C) 2018 Intel Corporation
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a copy
+ * of this software and associated documentation files (the "Software"), to deal
+ * in the Software without restriction, including without limitation the rights
+ * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the Software is
+ * furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+ * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+ * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+ * SOFTWARE.
+ */
+
+#include <stdlib.h>
+#include <string.h>
+
+#include "intel_chipset.h"
+#include "perf.h"
+#include "i915_perf_metrics.h"
+
+struct intel_perf *
+intel_perf_for_devinfo(const struct intel_device_info *devinfo)
+{
+	struct intel_perf_devinfo gputop_devinfo = {};
+
+	if (devinfo->is_haswell)
+		return intel_perf_get_metrics_hsw(&gputop_devinfo);
+	if (devinfo->is_broadwell)
+		return intel_perf_get_metrics_bdw(&gputop_devinfo);
+	if (devinfo->is_cherryview)
+		return intel_perf_get_metrics_chv(&gputop_devinfo);
+	if (devinfo->is_skylake) {
+		switch (devinfo->gt) {
+		case 2:
+			return intel_perf_get_metrics_sklgt2(&gputop_devinfo);
+		case 3:
+			return intel_perf_get_metrics_sklgt3(&gputop_devinfo);
+		case 4:
+			return intel_perf_get_metrics_sklgt4(&gputop_devinfo);
+		default:
+			return NULL;
+		}
+	}
+	if (devinfo->is_broxton)
+		return intel_perf_get_metrics_bxt(&gputop_devinfo);
+	if (devinfo->is_kabylake) {
+		switch (devinfo->gt) {
+		case 2:
+			return intel_perf_get_metrics_kblgt2(&gputop_devinfo);
+		case 3:
+			return intel_perf_get_metrics_kblgt3(&gputop_devinfo);
+		default:
+			return NULL;
+		}
+	}
+	if (devinfo->is_geminilake)
+		return intel_perf_get_metrics_glk(&gputop_devinfo);
+	if (devinfo->is_coffeelake) {
+		switch (devinfo->gt) {
+		case 2:
+			return intel_perf_get_metrics_cflgt2(&gputop_devinfo);
+		case 3:
+			return intel_perf_get_metrics_cflgt3(&gputop_devinfo);
+		default:
+			return NULL;
+		}
+	}
+	if (devinfo->is_cannonlake)
+		return intel_perf_get_metrics_cnl(&gputop_devinfo);
+	if (devinfo->is_icelake)
+		return intel_perf_get_metrics_icl(&gputop_devinfo);
+	return NULL;
+}
+
+static struct intel_perf_logical_counter_group *
+intel_perf_logical_counter_group_new(struct intel_perf *perf,
+				     struct intel_perf_logical_counter_group *parent,
+				     const char *name)
+{
+	struct intel_perf_logical_counter_group *group = calloc(1, sizeof(*group));
+
+	group->name = strdup(name);
+
+	IGT_INIT_LIST_HEAD(&group->counters);
+	IGT_INIT_LIST_HEAD(&group->groups);
+
+	if (parent)
+		igt_list_add_tail(&group->link, &parent->groups);
+	else
+		IGT_INIT_LIST_HEAD(&group->link);
+
+	return group;
+}
+
+struct intel_perf *
+intel_perf_new(void)
+{
+	struct intel_perf *perf = calloc(1, sizeof(*perf));
+
+	perf->root_group = intel_perf_logical_counter_group_new(perf, NULL, "");
+
+	IGT_INIT_LIST_HEAD(&perf->metric_sets);
+
+	return perf;
+}
+
+static void
+intel_perf_logical_counter_group_free(struct intel_perf_logical_counter_group *group)
+{
+	struct intel_perf_logical_counter_group *child, *tmp;
+
+	igt_list_for_each_entry_safe(child, tmp, &group->groups, link) {
+		igt_list_del(&child->link);
+		intel_perf_logical_counter_group_free(child);
+	}
+
+	free(group->name);
+	free(group);
+}
+
+static void
+intel_perf_metric_set_free(struct intel_perf_metric_set *metric_set)
+{
+	free(metric_set->counters);
+	free(metric_set);
+}
+
+void
+intel_perf_free(struct intel_perf *perf)
+{
+	struct intel_perf_metric_set *metric_set, *tmp;
+
+	intel_perf_logical_counter_group_free(perf->root_group);
+
+	igt_list_for_each_entry_safe(metric_set, tmp, &perf->metric_sets, link) {
+		igt_list_del(&metric_set->link);
+		intel_perf_metric_set_free(metric_set);
+	}
+
+	free(perf);
+}
+
+void
+intel_perf_add_logical_counter(struct intel_perf *perf,
+			       struct intel_perf_logical_counter *counter,
+			       const char *group_path)
+{
+	const char *group_path_end = group_path + strlen(group_path);
+	struct intel_perf_logical_counter_group *group = perf->root_group, *child_group = NULL;
+	const char *name = group_path;
+
+	while (name < group_path_end) {
+		const char *name_end = strstr(name, "/");
+		char group_name[128] = { 0, };
+		struct intel_perf_logical_counter_group *iter_group;
+
+		if (!name_end)
+			name_end = group_path_end;
+
+		memcpy(group_name, name, name_end - name);
+
+		child_group = NULL;
+		igt_list_for_each_entry(iter_group, &group->groups, link) {
+			if (!strcmp(iter_group->name, group_name)) {
+				child_group = iter_group;
+				break;
+			}
+		}
+
+		if (!child_group)
+			child_group = intel_perf_logical_counter_group_new(perf, group, group_name);
+
+		name = name_end + 1;
+		group = child_group;
+	}
+
+	igt_list_add_tail(&counter->link, &child_group->counters);
+}
+
+void
+intel_perf_add_metric_set(struct intel_perf *perf,
+			  struct intel_perf_metric_set *metric_set)
+{
+	igt_list_add_tail(&metric_set->link, &perf->metric_sets);
+}
diff --git a/lib/i915/perf.h b/lib/i915/perf.h
new file mode 100644
index 00000000..5a091c46
--- /dev/null
+++ b/lib/i915/perf.h
@@ -0,0 +1,238 @@
+/*
+ * Copyright (C) 2015-2016 Intel Corporation
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a copy
+ * of this software and associated documentation files (the "Software"), to deal
+ * in the Software without restriction, including without limitation the rights
+ * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the Software is
+ * furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+ * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+ * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+ * SOFTWARE.
+ */
+
+#ifndef PERF_METRICS_H
+#define PERF_METRICS_H
+
+#ifdef __cplusplus
+extern "C" {
+#endif
+
+#include <stdbool.h>
+#include <stdint.h>
+
+#include <i915_drm.h>
+
+#include "igt_list.h"
+
+struct intel_device_info;
+
+struct intel_perf_devinfo {
+	char devname[20];
+	char prettyname[100];
+
+	/*
+	 * Always false for gputop, we don't have the additional
+	 * snapshots of register values, only the OA reports.
+	 */
+	bool query_mode;
+
+	bool has_dynamic_configs;
+
+	struct {
+		uint32_t max_slices;
+		uint32_t max_subslices;
+		uint32_t max_eus_per_subslice;
+		uint32_t n_threads_per_eu;
+
+		/*
+		 * Max values should be enough for a while (famous
+		 * last words...).
+		 */
+		uint8_t slices_mask[1];
+		uint8_t subslices_mask[10];
+		uint8_t eus_mask[128];
+	} topology;
+
+	/* The following fields are prepared for equations from the XML files.
+	 * Their values are build up from the topology fields.
+	 */
+	uint32_t devid;
+	uint32_t gen;
+	uint32_t revision;
+	uint64_t timestamp_frequency;
+	uint64_t gt_min_freq;
+	uint64_t gt_max_freq;
+
+	uint64_t n_eus;
+	uint64_t n_eu_slices;
+	uint64_t n_eu_sub_slices;
+	uint64_t subslice_mask;
+	uint64_t slice_mask;
+	uint64_t eu_threads_count;
+};
+
+typedef enum {
+	INTEL_PERF_LOGICAL_COUNTER_STORAGE_UINT64,
+	INTEL_PERF_LOGICAL_COUNTER_STORAGE_UINT32,
+	INTEL_PERF_LOGICAL_COUNTER_STORAGE_DOUBLE,
+	INTEL_PERF_LOGICAL_COUNTER_STORAGE_FLOAT,
+	INTEL_PERF_LOGICAL_COUNTER_STORAGE_BOOL32,
+} intel_perf_logical_counter_storage_t;
+
+typedef enum {
+	INTEL_PERF_LOGICAL_COUNTER_TYPE_RAW,
+	INTEL_PERF_LOGICAL_COUNTER_TYPE_DURATION_RAW,
+	INTEL_PERF_LOGICAL_COUNTER_TYPE_DURATION_NORM,
+	INTEL_PERF_LOGICAL_COUNTER_TYPE_EVENT,
+	INTEL_PERF_LOGICAL_COUNTER_TYPE_THROUGHPUT,
+	INTEL_PERF_LOGICAL_COUNTER_TYPE_TIMESTAMP,
+} intel_perf_logical_counter_type_t;
+
+typedef enum {
+	/* size */
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_BYTES,
+
+	/* frequency */
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_HZ,
+
+	/* time */
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_NS,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_US,
+
+	/**/
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_PIXELS,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_TEXELS,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_THREADS,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_PERCENT,
+
+	/* events */
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_MESSAGES,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_NUMBER,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_CYCLES,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_EVENTS,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_UTILIZATION,
+
+	/**/
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_EU_SENDS_TO_L3_CACHE_LINES,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_EU_ATOMIC_REQUESTS_TO_L3_CACHE_LINES,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_EU_REQUESTS_TO_L3_CACHE_LINES,
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_EU_BYTES_PER_L3_CACHE_LINE,
+
+	INTEL_PERF_LOGICAL_COUNTER_UNIT_MAX
+} intel_perf_logical_counter_unit_t;
+
+#define OAREPORT_REASON_MASK           0x3f
+#define OAREPORT_REASON_SHIFT          19
+#define OAREPORT_REASON_TIMER          (1<<0)
+#define OAREPORT_REASON_CTX_SWITCH     (1<<3)
+
+struct intel_perf_metric_set;
+struct intel_perf_logical_counter {
+	const struct intel_perf_metric_set *metric_set;
+	const char *name;
+	const char *symbol_name;
+	const char *desc;
+	intel_perf_logical_counter_storage_t storage;
+	intel_perf_logical_counter_type_t type;
+	intel_perf_logical_counter_unit_t unit;
+	union {
+		uint64_t (*max_uint64)(const struct intel_perf_devinfo *devinfo,
+				       const struct intel_perf_metric_set *metric_set,
+				       uint64_t *deltas);
+		double (*max_float)(const struct intel_perf_devinfo *devinfo,
+				    const struct intel_perf_metric_set *metric_set,
+				    uint64_t *deltas);
+	};
+
+	union {
+		uint64_t (*read_uint64)(const struct intel_perf_devinfo *devinfo,
+					const struct intel_perf_metric_set *metric_set,
+					uint64_t *deltas);
+		double (*read_float)(const struct intel_perf_devinfo *devinfo,
+				     const struct intel_perf_metric_set *metric_set,
+				     uint64_t *deltas);
+	};
+
+	struct igt_list_head link; /* list from intel_perf_logical_counter_group.counters */
+};
+
+struct intel_perf_register_prog {
+	uint32_t reg;
+	uint32_t val;
+};
+
+struct intel_perf_metric_set {
+	const char *name;
+	const char *symbol_name;
+	const char *hw_config_guid;
+
+	struct intel_perf_logical_counter *counters;
+	int n_counters;
+
+	uint64_t perf_oa_metrics_set;
+	int perf_oa_format;
+	int perf_raw_size;
+
+	/* For indexing into accumulator->deltas[] ... */
+	int gpu_time_offset;
+	int gpu_clock_offset;
+	int a_offset;
+	int b_offset;
+	int c_offset;
+
+	struct intel_perf_register_prog *b_counter_regs;
+	uint32_t n_b_counter_regs;
+
+	struct intel_perf_register_prog *mux_regs;
+	uint32_t n_mux_regs;
+
+	struct intel_perf_register_prog *flex_regs;
+	uint32_t n_flex_regs;
+
+	struct igt_list_head link;
+};
+
+/* A tree structure with group having subgroups and counters. */
+struct intel_perf_logical_counter_group {
+	char *name;
+
+	struct igt_list_head counters;
+	struct igt_list_head groups;
+
+	struct igt_list_head link;  /* link for intel_perf_logical_counter_group.groups */
+};
+
+struct intel_perf {
+	const char *name;
+
+	struct intel_perf_logical_counter_group *root_group;
+
+	struct igt_list_head metric_sets;
+};
+
+struct intel_perf *intel_perf_for_devinfo(const struct intel_device_info *devinfo);
+struct intel_perf *intel_perf_new(void);
+void intel_perf_free(struct intel_perf *perf);
+
+void intel_perf_add_logical_counter(struct intel_perf *perf,
+				    struct intel_perf_logical_counter *counter,
+				    const char *group);
+
+void intel_perf_add_metric_set(struct intel_perf *perf,
+			       struct intel_perf_metric_set *metric_set);
+
+#ifdef __cplusplus
+};
+#endif
+
+#endif /* PERF_METRICS_H */
diff --git a/lib/meson.build b/lib/meson.build
index e87e5803..edff8a67 100644
--- a/lib/meson.build
+++ b/lib/meson.build
@@ -170,4 +170,68 @@ lib_igt_perf_build = static_library('igt_perf',
 lib_igt_perf = declare_dependency(link_with : lib_igt_perf_build,
 				  include_directories : inc)
 
+
+i915_perf_files = [
+  'i915/perf.c',
+]
+
+i915_perf_hardware = [
+  'hsw',
+  'bdw', 'chv',
+  'sklgt2', 'sklgt3', 'sklgt4',
+  'kblgt2', 'kblgt3',
+  'cflgt2', 'cflgt3',
+  'bxt', 'glk',
+  'cnl',
+  'icl'
+]
+
+i915_xml_files = []
+foreach hw : i915_perf_hardware
+  i915_xml_files += 'i915/perf-configs/oa- at 0@.xml'.format(hw)
+endforeach
+
+i915_perf_files += custom_target(
+  'i915-perf-metrics',
+  input : i915_xml_files,
+  output : [ 'i915_perf_metrics.c', 'i915_perf_metrics.h' ],
+  command : [
+    find_program('i915/perf-configs/perf-codegen.py'),
+    '--code', '@OUTPUT0@',
+    '--header', '@OUTPUT1@',
+    '@INPUT@',
+  ])
+
+lib_igt_i915_perf_build = shared_library(
+  'i915_perf',
+  i915_perf_files,
+  dependencies: [ lib_igt, lib_igt_chipset ],
+  include_directories : inc,
+  install: true)
+
+lib_igt_i915_perf = declare_dependency(
+  link_with : lib_igt_i915_perf_build,
+  include_directories : inc)
+
+install_headers(
+  'igt_list.h',
+  'intel_chipset.h',
+  'i915/perf.h',
+  subdir : 'i915-perf'
+)
+
+pkgconf = configuration_data()
+
+pkgconf.set('prefix', get_option('prefix'))
+pkgconf.set('exec_prefix', '${prefix}')
+pkgconf.set('libdir', '${prefix}/@0@'.format(get_option('libdir')))
+pkgconf.set('includedir', '${prefix}/@0@/i915-perf'.format(get_option('includedir')))
+pkgconf.set('version', meson.project_version())
+
+configure_file(
+  input : 'i915-perf.pc.in',
+  output : 'i915-perf.pc',
+  configuration : pkgconf,
+  install_dir : pkgconfigdir)
+
 subdir('tests')
diff --git a/tools/i915-perf/i915_perf_configs.c b/tools/i915-perf/i915_perf_configs.c
new file mode 100644
index 00000000..eeb32a53
--- /dev/null
+++ b/tools/i915-perf/i915_perf_configs.c
@@ -0,0 +1,277 @@
+/*
+ * Copyright (C) 2018 Intel Corporation
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a copy
+ * of this software and associated documentation files (the "Software"), to deal
+ * in the Software without restriction, including without limitation the rights
+ * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the Software is
+ * furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+ * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+ * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+ * SOFTWARE.
+ */
+
+#include <assert.h>
+#include <dirent.h>
+#include <errno.h>
+#include <fcntl.h>
+#include <getopt.h>
+#include <inttypes.h>
+#include <stdbool.h>
+#include <stdint.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <sys/ioctl.h>
+#include <sys/sysmacros.h>
+#include <sys/types.h>
+#include <sys/stat.h>
+#include <unistd.h>
+
+#include <i915_drm.h>
+
+#include "intel_chipset.h"
+#include "i915/perf.h"
+
+static bool
+read_file_uint64(const char *file, uint64_t *value)
+{
+	char buf[32];
+	int fd, n;
+
+	fd = open(file, 0);
+	if (fd < 0)
+		return false;
+	n = read(fd, buf, sizeof (buf) - 1);
+	close(fd);
+	if (n < 0)
+		return false;
+
+	buf[n] = '\0';
+	*value = strtoull(buf, 0, 0);
+
+	return true;
+}
+
+static uint32_t
+read_device_param(const char *stem, int id, const char *param)
+{
+	char *name;
+	int ret = asprintf(&name, "/sys/class/drm/%s%u/device/%s", stem, id, param);
+	uint64_t value;
+	bool success;
+
+	assert(ret != -1);
+
+	success = read_file_uint64(name, &value);
+	free(name);
+
+	return success ? value : 0;
+}
+
+static int
+find_intel_render_node(void)
+{
+	for (int i = 128; i < (128 + 16); i++) {
+		if (read_device_param("renderD", i, "vendor") == 0x8086)
+			return i;
+	}
+
+	return -1;
+}
+
+static int
+open_render_node(uint32_t *devid)
+{
+	char *name;
+	int ret;
+	int fd;
+
+	int render = find_intel_render_node();
+	if (render < 0)
+		return -1;
+
+	ret = asprintf(&name, "/dev/dri/renderD%u", render);
+	assert(ret != -1);
+
+	*devid = read_device_param("renderD", render, "device");
+
+	fd = open(name, O_RDWR);
+	free(name);
+
+	return fd;
+}
+
+static int
+get_card_for_fd(int fd)
+{
+	struct stat sb;
+	int mjr, mnr;
+	char buffer[128];
+	DIR *drm_dir;
+	struct dirent *entry;
+	int retval = -1;
+
+	if (fstat(fd, &sb)) {
+		fprintf(stderr, "Failed to stat DRM fd\n");
+		return -1;
+	}
+
+	mjr = major(sb.st_rdev);
+	mnr = minor(sb.st_rdev);
+
+	snprintf(buffer, sizeof(buffer), "/sys/dev/char/%d:%d/device/drm", mjr, mnr);
+
+	drm_dir = opendir(buffer);
+	assert(drm_dir != NULL);
+
+	while ((entry = readdir(drm_dir))) {
+		if (entry->d_type == DT_DIR && strncmp(entry->d_name, "card", 4) == 0) {
+			retval = strtoull(entry->d_name + 4, NULL, 10);
+			break;
+		}
+	}
+
+	closedir(drm_dir);
+
+	return retval;
+}
+
+static int
+perf_ioctl(int fd, unsigned long request, void *arg)
+{
+	int ret;
+
+	do {
+		ret = ioctl(fd, request, arg);
+	} while (ret == -1 && (errno == EINTR || errno == EAGAIN));
+
+	return ret;
+}
+
+static const char *
+metric_name(struct intel_perf *perf, const char *hw_config_guid)
+{
+	struct intel_perf_metric_set *metric_set;
+
+	igt_list_for_each_entry(metric_set, &perf->metric_sets, link) {
+		if (!strcmp(metric_set->hw_config_guid, hw_config_guid))
+			return metric_set->symbol_name;
+	}
+
+	return "Unknown";
+}
+
+static void
+usage(void)
+{
+	printf("Usage: i915-perf-configs [options]\n"
+	       "\n"
+	       "     --purge, -p         Purge configurations from the kernel\n"
+	       "     --list, -l          List configurations from the kernel\n");
+}
+
+int
+main(int argc, char *argv[])
+{
+	char metrics_path[128];
+	DIR *metrics_dir;
+	struct dirent *entry;
+	int drm_fd, drm_card;
+	int opt;
+	bool purge = false;
+	const struct option long_options[] = {
+		{"help",   no_argument, 0, 'h'},
+		{"list",   no_argument, 0, 'l'},
+		{"purge",  no_argument, 0, 'p'},
+		{0, 0, 0, 0}
+	};
+	const struct intel_device_info *devinfo;
+	struct intel_perf *perf;
+	uint32_t devid = 0;
+
+	while ((opt = getopt_long(argc, argv, "hlp", long_options, NULL)) != -1) {
+		switch (opt) {
+		case 'h':
+			usage();
+			return EXIT_SUCCESS;
+		case 'l':
+			break;
+		case 'p':
+			purge = true;
+			break;
+		default:
+			fprintf(stderr, "Internal error: "
+				"unexpected getopt value: %d\n", opt);
+			usage();
+			return EXIT_FAILURE;
+		}
+	}
+
+	drm_fd = open_render_node(&devid);
+	drm_card = get_card_for_fd(drm_fd);
+
+	fprintf(stdout, "Found device id=0x%x\n", devid);
+
+	devinfo = intel_get_device_info(devid);
+	if (!devinfo) {
+		fprintf(stderr, "No device info found.\n");
+		return EXIT_FAILURE;
+	}
+
+	fprintf(stdout, "Device gen=%i gt=%i\n", devinfo->gen, devinfo->gt);
+
+	perf = intel_perf_for_devinfo(devinfo);
+	if (!perf) {
+		fprintf(stderr, "No perf data found.\n");
+		return EXIT_FAILURE;
+	}
+
+	snprintf(metrics_path, sizeof(metrics_path),
+		 "/sys/class/drm/card%d/metrics", drm_card);
+	metrics_dir = opendir(metrics_path);
+	if (!metrics_dir)
+		return EXIT_FAILURE;
+
+	fprintf(stdout, "Looking at metrics in %s\n", metrics_path);
+
+	while ((entry = readdir(metrics_dir))) {
+		char metric_id_path[400];
+		uint64_t metric_id;
+
+		if (entry->d_type != DT_DIR)
+			continue;
+
+		snprintf(metric_id_path, sizeof(metric_id_path),
+			 "%s/%s/id", metrics_path, entry->d_name);
+
+		if (!read_file_uint64(metric_id_path, &metric_id))
+			continue;
+
+		if (purge) {
+			if (perf_ioctl(drm_fd, DRM_IOCTL_I915_PERF_REMOVE_CONFIG, &metric_id) == 0)
+				fprintf(stdout, "\tRemoved config %s id=%03" PRIu64 " name=%s\n",
+					entry->d_name, metric_id, metric_name(perf, entry->d_name));
+			else
+				fprintf(stdout, "\tFailed to remove config %s id=%03" PRIu64 " name=%s\n",
+					entry->d_name, metric_id, metric_name(perf, entry->d_name));
+		} else {
+			fprintf(stdout, "\tConfig %s id=%03" PRIu64 " name=%s\n",
+				entry->d_name, metric_id, metric_name(perf, entry->d_name));
+		}
+	}
+
+	closedir(metrics_dir);
+	close(drm_fd);
+
+	return EXIT_SUCCESS;
+}
diff --git a/tools/i915-perf/meson.build b/tools/i915-perf/meson.build
new file mode 100644
index 00000000..0ebdd185
--- /dev/null
+++ b/tools/i915-perf/meson.build
@@ -0,0 +1,5 @@
+executable('i915-perf-configs',
+           [ 'i915_perf_configs.c' ],
+           include_directories: inc,
+           dependencies: [lib_igt_chipset, lib_igt_i915_perf],
+           install: true)
diff --git a/tools/meson.build b/tools/meson.build
index cf3f37b2..59b56d5d 100644
--- a/tools/meson.build
+++ b/tools/meson.build
@@ -100,4 +100,5 @@ executable('amd_hdmi_compliance', 'amd_hdmi_compliance.c',
 	   install_rpath : bindir_rpathdir,
 	   install : true)
 
+subdir('i915-perf')
 subdir('null_state_gen')
-- 
2.20.1



More information about the igt-dev mailing list